Publications

3,826 major publications by members of the MERL staff.


  •  Ebbers, J., Germain, F.G., Wilkinghoff, K., Wichern, G., Le Roux, J., "No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10890706, April 2025.
    BibTeX TR2025-037 PDF
    • @inproceedings{Ebbers2025mar,
    • author = {Ebbers, Janek and Germain, François G. and Wilkinghoff, Kevin and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10890706},
    • url = {https://www.merl.com/publications/TR2025-037}
    • }
  •  Gruttadauria, E., Fontaine, M., Le Roux, J., Essid, S., "O-EENC-SD: Efficient Online End-to-End Neural Clustering for Speaker Diarization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10890837, April 2025.
    BibTeX TR2025-031 PDF
    • @inproceedings{Gruttadauria2025mar,
    • author = {Gruttadauria, Elio and Fontaine, Mathieu and {Le Roux}, Jonathan and Essid, Slim},
    • title = {{{O-EENC-SD}: Efficient Online End-to-End Neural Clustering for Speaker Diarization}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10890837},
    • url = {https://www.merl.com/publications/TR2025-031}
    • }
  •  Hori, C., Kambara, M., Sugiura, K., Ota, K., Khurana, S., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10887717, April 2025.
    BibTeX TR2025-034 PDF
    • @inproceedings{Hori2025mar,
    • author = {Hori, Chiori and Kambara, Motonari and Sugiura, Komei and Ota, Kei and Khurana, Sameer and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    • title = {{Interactive Robot Action Replanning using Multimodal {LLM} Trained from Human Demonstration Videos}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10887717},
    • url = {https://www.merl.com/publications/TR2025-034}
    • }
  •  Kitichotkul, R., Rapp, J., Ma, Y., Mansour, H., "Doppler Single-Photon Lidar", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888897, April 2025, pp. 1-5.
    BibTeX TR2025-028 PDF
    • @inproceedings{Kitichotkul2025mar,
    • author = {Kitichotkul, Ruangrawee and Rapp, Joshua and Ma, Yanting and Mansour, Hassan},
    • title = {{Doppler Single-Photon Lidar}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • pages = {1--5},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP49660.2025.10888897},
    • url = {https://www.merl.com/publications/TR2025-028}
    • }
  •  Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10889481, April 2025.
    BibTeX TR2025-029 PDF Software
    • @inproceedings{Masuyama2025mar,
    • author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, François G. and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10889481},
    • url = {https://www.merl.com/publications/TR2025-029}
    • }
  •  Saijo, K., Ebbers, J., Germain, F.G., Khurana, S., Wichern, G., Le Roux, J., "Leveraging Audio-Only Data for Text-Queried Target Sound Extraction", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888769, April 2025.
    BibTeX TR2025-033 PDF
    • @inproceedings{Saijo2025mar2,
    • author = {Saijo, Kohei and Ebbers, Janek and Germain, François G. and Khurana, Sameer and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Leveraging Audio-Only Data for Text-Queried Target Sound Extraction}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10888769},
    • url = {https://www.merl.com/publications/TR2025-033}
    • }
  •  Saijo, K., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Task-Aware Unified Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10887819, April 2025.
    BibTeX TR2025-032 PDF
    • @inproceedings{Saijo2025mar,
    • author = {Saijo, Kohei and Ebbers, Janek and Germain, François G. and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Task-Aware Unified Source Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10887819},
    • url = {https://www.merl.com/publications/TR2025-032}
    • }
  •  Teh, A., Ali, W.H., Rapp, J., Mansour, H., "Indoor Airflow Imaging Using Physics-Informed Schlieren Tomography", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10889412, April 2025, pp. 1-5.
    BibTeX TR2025-035 PDF
    • @inproceedings{Teh2025mar,
    • author = {Teh, Arjun and Ali, Wael H. and Rapp, Joshua and Mansour, Hassan},
    • title = {{Indoor Airflow Imaging Using Physics-Informed Schlieren Tomography}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • pages = {1--5},
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10889412},
    • url = {https://www.merl.com/publications/TR2025-035}
    • }
  •  Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Keeping the Balance: Anomaly Score Calculation for Domain Generalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP49660.2025.10888402, April 2025.
    BibTeX TR2025-030 PDF
    • @inproceedings{Wilkinghoff2025mar,
    • author = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, François G. and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Keeping the Balance: Anomaly Score Calculation for Domain Generalization}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • doi = {10.1109/ICASSP49660.2025.10888402},
    • url = {https://www.merl.com/publications/TR2025-030}
    • }
  •  Yataka, R., Wang, P., Boufounos, P.T., Takahashi, R., "Multi-View Radar Detection Transformer with Differentiable Positional Encoding", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), April 2025.
    BibTeX TR2025-027 PDF
    • @inproceedings{Yataka2025mar,
    • author = {Yataka, Ryoma and Wang, Pu and Boufounos, Petros T. and Takahashi, Ryuhei},
    • title = {{Multi-View Radar Detection Transformer with Differentiable Positional Encoding}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = apr,
    • url = {https://www.merl.com/publications/TR2025-027}
    • }
  •  Hu, Y., Lohit, S., Kamilov, U., Marks, T.K., "Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal", arXiv, April 2025.
    BibTeX arXiv
    • @article{Hu2025apr,
    • author = {Hu, Yuyang and Lohit, Suhas and Kamilov, Ulugbek and Marks, Tim K.},
    • title = {{Multimodal Diffusion Bridge with Attention-Based SAR Fusion for Satellite Image Cloud Removal}},
    • journal = {arXiv},
    • year = 2025,
    • month = apr,
    • url = {https://arxiv.org/abs/2504.03607}
    • }
  •  Li, K., Zhang, T., Peng, K.-C., Wang, G., "PF3Det: A Prompted Foundation Feature Assisted Visual LiDAR 3D Detector", arXiv, April 2025.
    BibTeX arXiv
    • @article{Li2025apr,
    • author = {Li, Kaidong and Zhang, Tianxiao and Peng, Kuan-Chuan and Wang, Guanghui},
    • title = {{PF3Det: A Prompted Foundation Feature Assisted Visual LiDAR 3D Detector}},
    • journal = {arXiv},
    • year = 2025,
    • month = apr,
    • url = {https://arxiv.org/abs/2504.03563}
    • }
  •  Ghezzi, A., Nurkanović, A., Weiss, A., Diehl, M., Di Cairano, S., "A Comparative Study of MINLP and MPVC Formulations for Solving Complex Nonlinear Decision-Making Problems in Aerospace Applications", arXiv, April 2025.
    BibTeX arXiv
    • @article{Ghezzi2025apr,
    • author = {Ghezzi, Andrea and Nurkanović, Armin and Weiss, Avishai and Diehl, Moritz and {Di Cairano}, Stefano},
    • title = {{A Comparative Study of MINLP and MPVC Formulations for Solving Complex Nonlinear Decision-Making Problems in Aerospace Applications}},
    • journal = {arXiv},
    • year = 2025,
    • month = apr,
    • url = {https://arxiv.org/abs/2504.02375}
    • }
  •  Jung, Y.G., Park, J., Yoon, J., Peng, K.-C., Kim, W., Teoh, A.B.J., Camps, O., "TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection", arXiv, April 2025.
    BibTeX arXiv
    • @article{Jung2025apr,
    • author = {Jung, Yoon G. and Park, Jaewoo and Yoon, Jaeho and Peng, Kuan-Chuan and Kim, Wonchul and Teoh, Andrew B. J. and Camps, Octavia},
    • title = {{TailedCore: Few-Shot Sampling for Unsupervised Long-Tail Noisy Anomaly Detection}},
    • journal = {arXiv},
    • year = 2025,
    • month = apr,
    • url = {https://arxiv.org/abs/2504.02775}
    • }
  •  Lin, C., Boufounos, P.T., Ma, Y., Wang, Y., "Time-optimal single-scalar control on a qubit of unitary dynamics", arXiv, April 2025.
    BibTeX arXiv
    • @article{Lin2025apr,
    • author = {Lin, Chungwei and Boufounos, Petros T. and Ma, Yanting and Wang, Yebin},
    • title = {{Time-optimal single-scalar control on a qubit of unitary dynamics}},
    • journal = {arXiv},
    • year = 2025,
    • month = apr,
    • url = {https://arxiv.org/abs/2504.01785}
    • }
  •  Chakrabarty, A., Vanfretti, L., Wang, Y., Mineyuki, T., Zhan, S., Tang, W.-T., Paulson, J.A., Deshpande, V.M., Bortoff, S.A., Laughman, C.R., "Time-Series Generative Networks for Synthesizing Realistic Scenarios in Occupant-Centric Building Simulation", Building Simulation, April 2025.
    BibTeX TR2025-043 PDF
    • @article{Chakrabarty2025apr,
    • author = {Chakrabarty, Ankush and Vanfretti, Luigi and Wang, Ye and Mineyuki, Takuma and Zhan, Sicheng and Tang, Wei-Ting and Paulson, Joel A. and Deshpande, Vedang M. and Bortoff, Scott A. and Laughman, Christopher R.},
    • title = {{Time-Series Generative Networks for Synthesizing Realistic Scenarios in Occupant-Centric Building Simulation}},
    • journal = {Building Simulation},
    • year = 2025,
    • month = apr,
    • url = {https://www.merl.com/publications/TR2025-043}
    • }
  •  Ick, C., Wichern, G., Masuyama, Y., Germain, F.G., Le Roux, J., "Data Augmentation Using Neural Acoustic Fields With Retrieval-Augmented Pre-training", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP) Satellite Workshop on Generative Data Augmentation for Real-World Signal Processing Applications (GenDA), April 2025.
    BibTeX TR2025-045 PDF
    • @inproceedings{Ick2025apr,
    • author = {Ick, Christopher and Wichern, Gordon and Masuyama, Yoshiki and Germain, François G. and {Le Roux}, Jonathan},
    • title = {{Data Augmentation Using Neural Acoustic Fields With Retrieval-Augmented Pre-training}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP) Satellite Workshop on Generative Data Augmentation for Real-World Signal Processing Applications (GenDA)},
    • year = 2025,
    • month = apr,
    • url = {https://www.merl.com/publications/TR2025-045}
    • }
  •  Smedemark-Margulies, N., Wang, Y., Koike-Akino, T., Liu, J., Parsons, K., Bicer, Y., Erdogmus, D., "Improving Subject Transfer in EEG Classification with Divergence Estimation", Journal of Neural Engineering, DOI: 10.1088/1741-2552/ad9777, Vol. 21, No. 6, April 2025.
    BibTeX TR2025-044 PDF Software
    • @article{Smedemark-Margulies2025apr,
    • author = {Smedemark-Margulies, Niklas and Wang, Ye and Koike-Akino, Toshiaki and Liu, Jing and Parsons, Kieran and Bicer, Yunus and Erdogmus, Deniz},
    • title = {{Improving Subject Transfer in EEG Classification with Divergence Estimation}},
    • journal = {Journal of Neural Engineering},
    • year = 2025,
    • volume = 21,
    • number = 6,
    • month = apr,
    • doi = {10.1088/1741-2552/ad9777},
    • url = {https://www.merl.com/publications/TR2025-044}
    • }
  •  Wang, J.-W., Nikovski, D.N., "Learning Visual Servoing for Nonholonomic Mobile Robots with Uncalibrated Cameras", The 40th ACM/SIGAPP Symposium On Applied Computing, March 2025.
    BibTeX TR2025-042 PDF
    • @inproceedings{Wang2025mar2,
    • author = {Wang, Jen-Wei and Nikovski, Daniel N.},
    • title = {{Learning Visual Servoing for Nonholonomic Mobile Robots with Uncalibrated Cameras}},
    • booktitle = {The 40th ACM/SIGAPP Symposium On Applied Computing},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-042}
    • }
  •  Dong, Y., Yagyu, E., Matsuda, T., Teo, K.H., Lin, C., Rakheja, S., "An accurate electrical and thermal co-simulation framework for modeling high-temperature DC and pulsed I-V characteristics of GaN HEMTs", IEEE Journal of the Electron Devices Society, March 2025.
    BibTeX TR2025-041 PDF
    • @article{Dong2025mar,
    • author = {Dong, Yicong and Yagyu, Eiji and Matsuda, Takashi and Teo, Koon Hoo and Lin, Chungwei and Rakheja, Shaloo},
    • title = {{An accurate electrical and thermal co-simulation framework for modeling high-temperature DC and pulsed I-V characteristics of GaN HEMTs}},
    • journal = {IEEE Journal of the Electron Devices Society},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-041}
    • }
  •  Das, A., Rahman, S., Xiang, X., Palash, R.H., Hossain, T., Sikder, B., Yagyu, E., Nakamura, M., Teo, K.H., Chowdhury, N., "Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate", Advanced Theory and Simulations, March 2025.
    BibTeX TR2025-040 PDF
    • @article{Das2025mar,
    • author = {Das, Aurick and Rahman, Saimur and Xiang, Xiaofeng and Palash, Rafid Hassan and Hossain, Toiyob and Sikder, Bejoy and Yagyu, Eiji and Nakamura, Marika and Teo, Koon Hoo and Chowdhury, Nadim},
    • title = {{Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate}},
    • journal = {Advanced Theory and Simulations},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-040}
    • }
  •  Ranade, S., Pais, G., Whitaker, R., Nascimento, J., Miraldo, P., Ramalingam, S., "SurfR: Surface Reconstruction with Multi-scale Attention", International Conference on 3D Vision (3DV), March 2025.
    BibTeX TR2025-039 PDF Presentation
    • @inproceedings{Ranade2025mar,
    • author = {Ranade, Siddhant and Pais, Goncalo and Whitaker, Ross and Nascimento, Jacinto and Miraldo, Pedro and Ramalingam, Srikumar},
    • title = {{SurfR: Surface Reconstruction with Multi-scale Attention}},
    • booktitle = {International Conference on 3D Vision (3DV)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-039}
    • }
  •  Shenoy, V., Lohit, S., Mansour, H., Chellappa, R., Marks, T.K., "Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shenoy2025mar,
    • author = {Shenoy, Vineet and Lohit, Suhas and Mansour, Hassan and Chellappa, Rama and Marks, Tim K.},
    • title = {{Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • url = {https://arxiv.org/abs/2503.17269}
    • }
  •  Shenoy, V., Wu, S., Comas, A., Marks, T.K., Lohit, S., Mansour, H., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shenoy2025mar2,
    • author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Marks, Tim K. and Lohit, Suhas and Mansour, Hassan},
    • title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • url = {https://arxiv.org/abs/2503.17351}
    • }
  •  Wilkinghoff, K., Fujimura, T., Imoto, K., Le Roux, J., Tan, Z.-H., Toda, T., "Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work", arXiv, March 2025.
    BibTeX arXiv
    • @article{Wilkinghoff2025mar2,
    • author = {Wilkinghoff, Kevin and Fujimura, Takuya and Imoto, Keisuke and {Le Roux}, Jonathan and Tan, Zheng-Hua and Toda, Tomoki},
    • title = {{Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • url = {https://arxiv.org/abs/2503.10435}
    • }