Publications

3,803 major publications by members of the MERL staff.


  •  Ick, Christopher, Wichern, Gordon, Masuyama, Yoshiki, Germain, François G, Le Roux, Jonathan, "Data Augmentation Using Neural Acoustic Fields With Retrieval-Augmented Pre-training", Tech. Rep. TR2025-045, Mitsubishi Electric Research Laboratories, Cambridge, MA, April 2025.
    BibTeX TR2025-045 PDF
    • @techreport{MERL_TR2025-045,
    • author = {Ick, Christopher and Wichern, Gordon and Masuyama, Yoshiki and Germain, François G. and {Le Roux}, Jonathan},
    • title = {Data Augmentation Using Neural Acoustic Fields With Retrieval-Augmented Pre-training},
    • institution = {MERL - Mitsubishi Electric Research Laboratories},
    • address = {Cambridge, MA 02139},
    • number = {TR2025-045},
    • month = apr,
    • year = 2025,
    • url = {https://www.merl.com/publications/TR2025-045/}
    • }
  •  Lin, C., Boufounos, P.T., Ma, Y., Wang, Y., "Time-optimal single-scalar control on a qubit of unitary dynamics", arXiv, April 2025.
    BibTeX arXiv
    • @article{Lin2025apr,
    • author = {Lin, Chungwei and Boufounos, Petros T. and Ma, Yanting and Wang, Yebin},
    • title = {{Time-optimal single-scalar control on a qubit of unitary dynamics}},
    • journal = {arXiv},
    • year = 2025,
    • month = apr,
    • eprint = {2504.01785},
    • archivePrefix = {arXiv},
    • url = {https://arxiv.org/abs/2504.01785}
    • }
  •  Chakrabarty, A., Vanfretti, L., Wang, Y., Mineyuki, T., Zhan, S., Tang, W.-T., Paulson, J.A., Deshpande, V.M., Bortoff, S.A., Laughman, C.R., "Time-Series Generative Networks for Synthesizing Realistic Scenarios in Occupant-Centric Building Simulation", Building Simulation, April 2025.
    BibTeX TR2025-043 PDF
    • @article{Chakrabarty2025apr,
    •   author  = {Chakrabarty, Ankush and Vanfretti, Luigi and Wang, Ye and Mineyuki, Takuma and Zhan, Sicheng and Tang, Wei-Ting and Paulson, Joel A. and Deshpande, Vedang M. and Bortoff, Scott A. and Laughman, Christopher R.},
    •   title   = {{Time-Series Generative Networks for Synthesizing Realistic Scenarios in Occupant-Centric Building Simulation}},
    •   journal = {Building Simulation},
    •   month   = apr,
    •   year    = {2025},
    •   url     = {https://www.merl.com/publications/TR2025-043},
    • }
  •  Smedemark-Margulies, N., Wang, Y., Koike-Akino, T., Liu, J., Parsons, K., Bicer, Y., Erdogmus, D., "Improving Subject Transfer in EEG Classification with Divergence Estimation", Journal of Neural Engineering, DOI: 10.1088/1741-2552/ad9777, Vol. 21, No. 6, April 2025.
    BibTeX TR2025-044 PDF Software
    • @article{Smedemark-Margulies2025apr,
    •   author  = {Smedemark-Margulies, Niklas and Wang, Ye and Koike-Akino, Toshiaki and Liu, Jing and Parsons, Kieran and Bicer, Yunus and Erdogmus, Deniz},
    •   title   = {{Improving Subject Transfer in EEG Classification with Divergence Estimation}},
    •   journal = {Journal of Neural Engineering},
    •   volume  = {21},
    •   number  = {6},
    •   month   = apr,
    •   year    = {2025},
    •   doi     = {10.1088/1741-2552/ad9777},
    •   url     = {https://www.merl.com/publications/TR2025-044},
    • }
  •  Wang, J.-W., Nikovski, D.N., "Learning Visual Servoing for Nonholonomic Mobile Robots with Uncalibrated Cameras", The 40th ACM/SIGAPP Symposium On Applied Computing, March 2025.
    BibTeX TR2025-042 PDF
    • @inproceedings{Wang2025mar2,
    •   author    = {Wang, Jen-Wei and Nikovski, Daniel N.},
    •   title     = {{Learning Visual Servoing for Nonholonomic Mobile Robots with Uncalibrated Cameras}},
    •   booktitle = {The 40th ACM/SIGAPP Symposium On Applied Computing},
    •   month     = mar,
    •   year      = {2025},
    •   url       = {https://www.merl.com/publications/TR2025-042},
    • }
  •  Dong, Y., Yagyu, E., Matsuda, T., Teo, K.H., Lin, C., Rakheja, S., "An accurate electrical and thermal co-simulation framework for modeling high-temperature DC and pulsed I-V characteristics of GaN HEMTs", IEEE Journal of the Electron Devices Society, March 2025.
    BibTeX TR2025-041 PDF
    • @article{Dong2025mar,
    •   author  = {Dong, Yicong and Yagyu, Eiji and Matsuda, Takashi and Teo, Koon Hoo and Lin, Chungwei and Rakheja, Shaloo},
    •   title   = {{An accurate electrical and thermal co-simulation framework for modeling high-temperature DC and pulsed I-V characteristics of GaN HEMTs}},
    •   journal = {IEEE Journal of the Electron Devices Society},
    •   month   = mar,
    •   year    = {2025},
    •   url     = {https://www.merl.com/publications/TR2025-041},
    • }
  •  Das, A., Rahman, S., Xiang, X., Palash, R.H., Hossain, T., Sikder, B., Yagyu, E., Nakamura, M., Teo, K.H., Chowdhury, N., "Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate", Advanced Theory and Simulations, March 2025.
    BibTeX TR2025-040 PDF
    • @article{Das2025mar,
    •   author  = {Das, Aurick and Rahman, Saimur and Xiang, Xiaofeng and Palash, Raffd Hassan and Hossain, Toiyob and Sikder, Bejoy and Yagyu, Eiji and Nakamura, Marika and Teo, Koon Hoo and Chowdhury, Nadim},
    •   title   = {{Inverse Design of AlGaN/GaN HEMT RF Device with Source Connected Field Plate}},
    •   journal = {Advanced Theory and Simulations},
    •   month   = mar,
    •   year    = {2025},
    •   url     = {https://www.merl.com/publications/TR2025-040},
    • }
  •  Ranade, S., Pais, G., Whitaker, R., Nascimento, J., Miraldo, P., Ramalingam, S., "SurfR: Surface Reconstruction with Multi-scale Attention", International Conference on 3D Vision (3DV), March 2025.
    BibTeX TR2025-039 PDF
    • @inproceedings{Ranade2025mar,
    •   author    = {Ranade, Siddhant and Pais, Goncalo and Whitaker, Ross and Nascimento, Jacinto and Miraldo, Pedro and Ramalingam, Srikumar},
    •   title     = {{SurfR: Surface Reconstruction with Multi-scale Attention}},
    •   booktitle = {International Conference on 3D Vision (3DV)},
    •   month     = mar,
    •   year      = {2025},
    •   url       = {https://www.merl.com/publications/TR2025-039},
    • }
  •  Shenoy, V., Lohit, S., Mansour, H., Chellappa, R., Marks, T.K., "Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shenoy2025mar,
    • author = {Shenoy, Vineet and Lohit, Suhas and Mansour, Hassan and Chellappa, Rama and Marks, Tim K.},
    • title = {{Recovering Pulse Waves from Video Using Deep Unrolling and Deep Equilibrium Models}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • eprint = {2503.17269},
    • archivePrefix = {arXiv},
    • url = {https://arxiv.org/abs/2503.17269}
    • }
  •  Shenoy, V., Wu, S., Comas, A., Marks, T.K., Lohit, S., Mansour, H., "Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shenoy2025mar2,
    • author = {Shenoy, Vineet and Wu, Shaoju and Comas, Armand and Marks, Tim K. and Lohit, Suhas and Mansour, Hassan},
    • title = {{Time-Series U-Net with Recurrence for Noise-Robust Imaging Photoplethysmography}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • eprint = {2503.17351},
    • archivePrefix = {arXiv},
    • url = {https://arxiv.org/abs/2503.17351}
    • }
  •  Wilkinghoff, K., Fujimura, T., Imoto, K., Le Roux, J., Tan, Z.-H., Toda, T., "Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work", arXiv, March 2025.
    BibTeX arXiv
    • @article{Wilkinghoff2025mar2,
    • author = {Wilkinghoff, Kevin and Fujimura, Takuya and Imoto, Keisuke and {Le Roux}, Jonathan and Tan, Zheng-Hua and Toda, Tomoki},
    • title = {{Handling Domain Shifts for Anomalous Sound Detection: A Review of DCASE-Related Work}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • eprint = {2503.10435},
    • archivePrefix = {arXiv},
    • url = {https://arxiv.org/abs/2503.10435}
    • }
  •  Shirai, Y., Raghunathan, A., Jha, D.K., "Hierarchical Contact-Rich Trajectory Optimization for Multi-Modal Manipulation using Tight Convex Relaxations", arXiv, March 2025.
    BibTeX arXiv
    • @article{Shirai2025mar,
    • author = {Shirai, Yuki and Raghunathan, Arvind and Jha, Devesh K.},
    • title = {{Hierarchical Contact-Rich Trajectory Optimization for Multi-Modal Manipulation using Tight Convex Relaxations}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • eprint = {2503.07963},
    • archivePrefix = {arXiv},
    • url = {https://arxiv.org/abs/2503.07963}
    • }
  •  Schperberg, A., Menner, M., Di Cairano, S., "Energy-Efficient Motion Planner for Legged Robots", arXiv, March 2025.
    BibTeX arXiv
    • @article{Schperberg2025mar,
    • author = {Schperberg, Alexander and Menner, Marcel and {Di Cairano}, Stefano},
    • title = {{Energy-Efficient Motion Planner for Legged Robots}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • eprint = {2503.06050},
    • archivePrefix = {arXiv},
    • url = {https://arxiv.org/abs/2503.06050}
    • }
  •  Araki, S., Ito, N., Haeb-Umbach, R., Wichern, G., Wang, Z.-Q., Mitsufuji, Y., "30+ Years of Source Separation Research: Achievements and Future Challenges", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-036 PDF
    • @inproceedings{Araki2025mar,
    •   author    = {Araki, Shoko and Ito, Nobutaka and Haeb-Umbach, Reinhold and Wichern, Gordon and Wang, Zhong-Qiu and Mitsufuji, Yuki},
    •   title     = {{30+ Years of Source Separation Research: Achievements and Future Challenges}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   month     = mar,
    •   year      = {2025},
    •   url       = {https://www.merl.com/publications/TR2025-036},
    • }
  •  Ebbers, J., Germain, F.G., Wilkinghoff, K., Wichern, G., Le Roux, J., "No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-037 PDF
    • @inproceedings{Ebbers2025mar,
    • author = {Ebbers, Janek and Germain, François G. and Wilkinghoff, Kevin and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{No Class Left Behind: A Closer Look at Class Balancing for Audio Tagging}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-037}
    • }
  •  Gruttadauria, E., Fontaine, M., Le Roux, J., Essid, S., "O-EENC-SD: Efficient Online End-to-End Neural Clustering for Speaker Diarization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-031 PDF
    • @inproceedings{Gruttadauria2025mar,
    •   author    = {Gruttadauria, Elio and Fontaine, Mathieu and {Le Roux}, Jonathan and Essid, Slim},
    •   title     = {{O-EENC-SD: Efficient Online End-to-End Neural Clustering for Speaker Diarization}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   month     = mar,
    •   year      = {2025},
    •   url       = {https://www.merl.com/publications/TR2025-031},
    • }
  •  Hori, C., Kambara, M., Sugiura, K., Ota, K., Khurana, S., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-034 PDF
    • @inproceedings{Hori2025mar,
    •   author    = {Hori, Chiori and Kambara, Motonari and Sugiura, Komei and Ota, Kei and Khurana, Sameer and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    •   title     = {{Interactive Robot Action Replanning using Multimodal LLM Trained from Human Demonstration Videos}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   month     = mar,
    •   year      = {2025},
    •   url       = {https://www.merl.com/publications/TR2025-034},
    • }
  •  Kitichotkul, R., Rapp, J., Ma, Y., Mansour, H., "Doppler Single-Photon Lidar", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-028 PDF
    • @inproceedings{Kitichotkul2025mar,
    •   author    = {Kitichotkul, Ruangrawee and Rapp, Joshua and Ma, Yanting and Mansour, Hassan},
    •   title     = {{Doppler Single-Photon Lidar}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   month     = mar,
    •   year      = {2025},
    •   url       = {https://www.merl.com/publications/TR2025-028},
    • }
  •  Masuyama, Y., Wichern, G., Germain, F.G., Ick, C., Le Roux, J., "Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-029 PDF Software
    • @inproceedings{Masuyama2025mar,
    • author = {Masuyama, Yoshiki and Wichern, Gordon and Germain, François G. and Ick, Christopher and {Le Roux}, Jonathan},
    • title = {{Retrieval-Augmented Neural Field for HRTF Upsampling and Personalization}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-029}
    • }
  •  Saijo, K., Ebbers, J., Germain, F.G., Khurana, S., Wichern, G., Le Roux, J., "Leveraging Audio-Only Data for Text-Queried Target Sound Extraction", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-033 PDF
    • @inproceedings{Saijo2025mar2,
    • author = {Saijo, Kohei and Ebbers, Janek and Germain, François G. and Khurana, Sameer and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Leveraging Audio-Only Data for Text-Queried Target Sound Extraction}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-033}
    • }
  •  Saijo, K., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Task-Aware Unified Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-032 PDF
    • @inproceedings{Saijo2025mar,
    • author = {Saijo, Kohei and Ebbers, Janek and Germain, François G. and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Task-Aware Unified Source Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-032}
    • }
  •  Teh, A., Ali, W.H., Rapp, J., Mansour, H., "Indoor Airflow Imaging Using Physics-Informed Schlieren Tomography", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-035 PDF
    • @inproceedings{Teh2025mar,
    •   author    = {Teh, Arjun and Ali, Wael H. and Rapp, Joshua and Mansour, Hassan},
    •   title     = {{Indoor Airflow Imaging Using Physics-Informed Schlieren Tomography}},
    •   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    •   month     = mar,
    •   year      = {2025},
    •   url       = {https://www.merl.com/publications/TR2025-035},
    • }
  •  Wilkinghoff, K., Yang, H., Ebbers, J., Germain, F.G., Wichern, G., Le Roux, J., "Keeping the Balance: Anomaly Score Calculation for Domain Generalization", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), March 2025.
    BibTeX TR2025-030 PDF
    • @inproceedings{Wilkinghoff2025mar,
    • author = {Wilkinghoff, Kevin and Yang, Haici and Ebbers, Janek and Germain, François G. and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Keeping the Balance: Anomaly Score Calculation for Domain Generalization}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-030}
    • }
  •  Tian, J., Shi, J., Chen, W., Arora, S., Masuyama, Y., Maekaku, T., Wu, Y., Peng, J., Bharadwaj, S., Zhao, Y., Cornell, S., Peng, Y., Yue, X., Yang, C.-H.H., Neubig, G., Watanabe, S., "ESPnet-SpeechLM: An Open Speech Language Model Toolkit", NAACL-HLT (the system demonstration track), March 2025.
    BibTeX TR2025-038 PDF
    • @inproceedings{Tian2025mar,
    • author = {Tian, Jinchuan and Shi, Jiatong and Chen, William and Arora, Siddhant and Masuyama, Yoshiki and Maekaku, Takashi and Wu, Yihan and Peng, Junyi and Bharadwaj, Shikhar and Zhao, Yiwen and Cornell, Samuele and Peng, Yifan and Yue, Xiang and Yang, Chao-Han H. and Neubig, Graham and Watanabe, Shinji},
    • title = {{ESPnet-SpeechLM: An Open Speech Language Model Toolkit}},
    • booktitle = {NAACL-HLT (the system demonstration track)},
    • year = 2025,
    • month = mar,
    • url = {https://www.merl.com/publications/TR2025-038}
    • }
  •  Koike-Akino, T., Tonin, F., Wu, Y., Wu, F.Z., Candogan, L.N., Cevher, V., "Quantum-PEFT: Ultra parameter-efficient fine-tuning", arXiv, March 2025.
    BibTeX arXiv
    • @article{Koike-Akino2025mar,
    • author = {Koike-Akino, Toshiaki and Tonin, Francesco and Wu, Yongtao and Wu, Frank Zhengqing and Candogan, Leyla Naz and Cevher, Volkan},
    • title = {{Quantum-PEFT: Ultra parameter-efficient fine-tuning}},
    • journal = {arXiv},
    • year = 2025,
    • month = mar,
    • eprint = {2503.05431},
    • archivePrefix = {arXiv},
    • url = {https://arxiv.org/abs/2503.05431}
    • }