Publications

264 / 3,793 publications found.


  •  Bralios, D., Wichern, G., Germain, F.G., Pan, Z., Khurana, S., Hori, C., Le Roux, J., "Generation or Replication: Auscultating Audio Latent Diffusion Models", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447705, March 2024, pp. 1156-1160.
    BibTeX TR2024-027 PDF
    • @inproceedings{Bralios2024mar,
    • author = {Bralios, Dimitrios and Wichern, Gordon and Germain, François G and Pan, Zexu and Khurana, Sameer and Hori, Chiori and {Le Roux}, Jonathan},
    • title = {{Generation or Replication: Auscultating Audio Latent Diffusion Models}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {1156--1160},
    • month = mar,
    • doi = {10.1109/ICASSP48485.2024.10447705},
    • url = {https://www.merl.com/publications/TR2024-027}
    • }
  •  Wu, S.-L., Chang, X., Wichern, G., Jung, J.-W., Germain, F.G., Le Roux, J., Watanabe, S., "Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and LLM Mix-up Augmentation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447215, March 2024, pp. 316-320.
    BibTeX TR2024-028 PDF
    • @inproceedings{Wu2024mar,
    • author = {Wu, Shih-Lun and Chang, Xuankai and Wichern, Gordon and Jung, Jee-weon and Germain, François G and {Le Roux}, Jonathan and Watanabe, Shinji},
    • title = {{Improving Audio Captioning Models with Fine-grained Audio Features, Text Embedding Supervision, and LLM Mix-up Augmentation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {316--320},
    • month = mar,
    • doi = {10.1109/ICASSP48485.2024.10447215},
    • url = {https://www.merl.com/publications/TR2024-028}
    • }
  •  Baoueb, T., Liu, H., Fontaine, M., Le Roux, J., Richard, G., "SpecDiff-GAN: A Spectrally-Shaped Noise Diffusion GAN for Speech and Music Synthesis", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446830, March 2024, pp. 986-990.
    BibTeX TR2024-013 PDF
    • @inproceedings{Baoueb2024mar,
    • author = {Baoueb, Teysir and Liu, Haocheng and Fontaine, Mathieu and {Le Roux}, Jonathan and Richard, Gaël},
    • title = {{SpecDiff-GAN: A Spectrally-Shaped Noise Diffusion GAN for Speech and Music Synthesis}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {986--990},
    • month = mar,
    • doi = {10.1109/ICASSP48485.2024.10446830},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-013}
    • }
  •  Hori, C., Wang, P., Rahman, M., Vaca-Rubio, C., Khurana, S., Cherian, A., Le Roux, J., "Wi-Fi based Indoor Monitoring Enhanced by Multimodal Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10447600, March 2024, pp. 13296-13300.
    BibTeX TR2024-012 PDF
    • @inproceedings{Hori2024mar,
    • author = {Hori, Chiori and Wang, Pu and Rahman, Mahbub and Vaca-Rubio, Cristian and Khurana, Sameer and Cherian, Anoop and {Le Roux}, Jonathan},
    • title = {{Wi-Fi based Indoor Monitoring Enhanced by Multimodal Fusion}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {13296--13300},
    • month = mar,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP48485.2024.10447600},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-012}
    • }
  •  Liu, H., Baoueb, T., Fontaine, M., Le Roux, J., Richard, G., "GLA-Grad: A Griffin-Lim Extended Waveform Generation Diffusion Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP48485.2024.10446058, March 2024, pp. 11611-11615.
    BibTeX TR2024-014 PDF
    • @inproceedings{Liu2024mar,
    • author = {Liu, Haocheng and Baoueb, Teysir and Fontaine, Mathieu and {Le Roux}, Jonathan and Richard, Gaël},
    • title = {{GLA-Grad: A Griffin-Lim Extended Waveform Generation Diffusion Model}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2024,
    • pages = {11611--11615},
    • month = mar,
    • doi = {10.1109/ICASSP48485.2024.10446058},
    • issn = {2379-190X},
    • isbn = {979-8-3503-4485-1},
    • url = {https://www.merl.com/publications/TR2024-014}
    • }
  •  Bortoff, S.A., Eisenhower, B., Adetola, V., O'Neill, Z., "Control Challenges and Opportunities in Building Automation" in The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future, February 2024.
    BibTeX TR2024-011 PDF
    • @incollection{Bortoff2024feb,
    • author = {Bortoff, Scott A. and Eisenhower, Bryan and Adetola, Veronica and O'Neill, Zheng},
    • title = {{Control Challenges and Opportunities in Building Automation}},
    • booktitle = {The Impact of Automatic Control Research on Industrial Innovation: Enabling a Sustainable Future},
    • year = 2024,
    • month = feb,
    • url = {https://www.merl.com/publications/TR2024-011}
    • }
  •  Liu, X., Paul, S., Chatterjee, M., Cherian, A., "CAVEN: An Embodied Conversational Agent for Efficient Audio-Visual Navigation in Noisy Environments", AAAI Conference on Artificial Intelligence, DOI: 10.1609/aaai.v38i4.28167, December 2023, pp. 3765-3773.
    BibTeX TR2023-154 PDF
    • @inproceedings{Liu2023dec2,
    • author = {Liu, Xiulong and Paul, Sudipta and Chatterjee, Moitreya and Cherian, Anoop},
    • title = {{CAVEN: An Embodied Conversational Agent for Efficient Audio-Visual Navigation in Noisy Environments}},
    • booktitle = {Proceedings of the 38th AAAI Conference on Artificial Intelligence},
    • year = 2023,
    • pages = {3765--3773},
    • month = dec,
    • doi = {10.1609/aaai.v38i4.28167},
    • url = {https://www.merl.com/publications/TR2023-154}
    • }
  •  Liu, J., Koike-Akino, T., Wang, P., Brand, M., Wang, Y., Parsons, K., "LoDA: Low-Dimensional Adaptation of Large Language Models", Advances in Neural Information Processing Systems (NeurIPS) workshop, December 2023.
    BibTeX TR2023-150 PDF
    • @inproceedings{Liu2023dec,
    • author = {Liu, Jing and Koike-Akino, Toshiaki and Wang, Pu and Brand, Matthew and Wang, Ye and Parsons, Kieran},
    • title = {{LoDA: Low-Dimensional Adaptation of Large Language Models}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS) workshop},
    • year = 2023,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2023-150}
    • }
  •  Kong, C., Yerazunis, W.S., Nikovski, D., "Stochastic Learning Manipulation of Object Pose With Under-Actuated Impulse Generator Arrays", International Conference on Machine Learning and Applications (ICMLA), DOI: 10.1109/ICMLA58977.2023.00024, December 2023, pp. 112-119.
    BibTeX TR2023-151 PDF
    • @inproceedings{Kong2023dec,
    • author = {Kong, Chuizheng and Yerazunis, William S. and Nikovski, Daniel},
    • title = {{Stochastic Learning Manipulation of Object Pose With Under-Actuated Impulse Generator Arrays}},
    • booktitle = {International Conference on Machine Learning and Applications (ICMLA)},
    • year = 2023,
    • pages = {112--119},
    • month = dec,
    • doi = {10.1109/ICMLA58977.2023.00024},
    • url = {https://www.merl.com/publications/TR2023-151}
    • }
  •  Sun, L., Jha, D.K., Hori, C., Jain, S., Corcodel, R., Zhu, X., Tomizuka, M., Romeres, D., "Interactive Planning Using Large Language Models for Partially Observable Robotics Tasks", Advances in Neural Information Processing Systems (NeurIPS) Workshop on Instruction Tuning and Instruction Following, December 2023.
    BibTeX TR2023-148 PDF Video
    • @inproceedings{Sun2023dec,
    • author = {Sun, Lingfeng and Jha, Devesh K. and Hori, Chiori and Jain, Siddarth and Corcodel, Radu and Zhu, Xinghao and Tomizuka, Masayoshi and Romeres, Diego},
    • title = {{Interactive Planning Using Large Language Models for Partially Observable Robotics Tasks}},
    • booktitle = {Advances in Neural Information Processing Systems (NeurIPS) Workshop on Instruction Tuning and Instruction Following},
    • year = 2023,
    • month = dec,
    • url = {https://www.merl.com/publications/TR2023-148}
    • }
  •  Zhou, A., Sun, H., Kitamura, S., Nikovski, D., "A Decision-Dependent Chance-Constrained Planning Model for Distribution Networks Under Extreme Weather Events", IEEE PES Innovative Smart Grid Technologies Europe (ISGT-Europe), DOI: 10.1109/ISGTEUROPE56780.2023.10408310, October 2023.
    BibTeX TR2023-133 PDF
    • @inproceedings{Zhou2023oct,
    • author = {Zhou, Anping and Sun, Hongbo and Kitamura, Shoichi and Nikovski, Daniel},
    • title = {{A Decision-Dependent Chance-Constrained Planning Model for Distribution Networks Under Extreme Weather Events}},
    • booktitle = {IEEE PES Innovative Smart Grid Technologies Europe (ISGT-Europe)},
    • year = 2023,
    • month = oct,
    • doi = {10.1109/ISGTEUROPE56780.2023.10408310},
    • url = {https://www.merl.com/publications/TR2023-133}
    • }
  •  Nair, N.G., Cherian, A., Lohit, S., Wang, Y., Koike-Akino, T., Patel, V.M., Marks, T.K., "Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis", IEEE International Conference on Computer Vision (ICCV), October 2023, pp. 20850-20860.
    BibTeX TR2023-126 PDF Software Presentation
    • @inproceedings{Nair2023sep,
    • author = {Nair, Nithin Gopalakrishnan and Cherian, Anoop and Lohit, Suhas and Wang, Ye and Koike-Akino, Toshiaki and Patel, Vishal M. and Marks, Tim K.},
    • title = {{Steered Diffusion: A Generalized Framework for Plug-and-Play Conditional Image Synthesis}},
    • booktitle = {Proceedings of the IEEE/CVF International Conference on Computer Vision},
    • year = 2023,
    • pages = {20850--20860},
    • month = oct,
    • publisher = {IEEE/CVF},
    • url = {https://www.merl.com/publications/TR2023-126}
    • }
  •  Wang, B., Zhang, S., Inoue, H., Kanemaru, M., "Semi-Supervised Machine Learning for Motor Eccentricity Fault Diagnosis", Asia Pacific Conference of the Prognostics and Health Management Society, DOI: 10.36001/phmap.2023.v4i1.3644, September 2023.
    BibTeX TR2023-117 PDF
    • @inproceedings{Wang2023sep,
    • author = {Wang, Bingnan and Zhang, Shen and Inoue, Hiroshi and Kanemaru, Makoto},
    • title = {{Semi-Supervised Machine Learning for Motor Eccentricity Fault Diagnosis}},
    • booktitle = {Asia Pacific Conference of the Prognostics and Health Management Society},
    • year = 2023,
    • month = sep,
    • publisher = {PHM Society},
    • doi = {10.36001/phmap.2023.v4i1.3644},
    • url = {https://www.merl.com/publications/TR2023-117}
    • }
  •  Zhan, S., Chakrabarty, A., Laughman, C.R., Chong, A., "A Virtual Testbed for Robust and Reproducible Calibration of Building Energy Simulation Models", IBPSA Building Simulation Conference, DOI: 10.26868/25222708.2023.1482, September 2023.
    BibTeX TR2023-114 PDF
    • @inproceedings{Zhan2023sep,
    • author = {Zhan, Sicheng and Chakrabarty, Ankush and Laughman, Christopher R. and Chong, Adrian},
    • title = {{A Virtual Testbed for Robust and Reproducible Calibration of Building Energy Simulation Models}},
    • booktitle = {IBPSA Building Simulation Conference},
    • year = 2023,
    • month = sep,
    • doi = {10.26868/25222708.2023.1482},
    • url = {https://www.merl.com/publications/TR2023-114}
    • }
  •  Hori, C., Peng, P., Harwath, D., Liu, X., Ota, K., Jain, S., Corcodel, R., Jha, D.K., Romeres, D., Le Roux, J., "Style-transfer based Speech and Audio-visual Scene understanding for Robot Action Sequence Acquisition from Videos", Interspeech, DOI: 10.21437/Interspeech.2023-1983, August 2023, pp. 4663-4667.
    BibTeX TR2023-104 PDF
    • @inproceedings{Hori2023aug,
    • author = {Hori, Chiori and Peng, Puyuan and Harwath, David and Liu, Xinyu and Ota, Kei and Jain, Siddarth and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and {Le Roux}, Jonathan},
    • title = {{Style-transfer based Speech and Audio-visual Scene understanding for Robot Action Sequence Acquisition from Videos}},
    • booktitle = {Interspeech},
    • year = 2023,
    • pages = {4663--4667},
    • month = aug,
    • doi = {10.21437/Interspeech.2023-1983},
    • url = {https://www.merl.com/publications/TR2023-104}
    • }
  •  Chakrabarty, A., Vinod, A.P., Mansour, H., Bortoff, S.A., Laughman, C.R., "Moving Horizon Estimation for Digital Twins using Deep Autoencoders", World Congress of the International Federation of Automatic Control (IFAC), Ishii, H., Ebihara, Y., Imura, J., Yamakita, M., Eds., DOI: 10.1016/j.ifacol.2023.10.207, July 2023, pp. 5500-5505.
    BibTeX TR2023-088 PDF
    • @inproceedings{Chakrabarty2023jul2,
    • author = {Chakrabarty, Ankush and Vinod, Abraham P. and Mansour, Hassan and Bortoff, Scott A. and Laughman, Christopher R.},
    • title = {{Moving Horizon Estimation for Digital Twins using Deep Autoencoders}},
    • booktitle = {World Congress of the International Federation of Automatic Control (IFAC)},
    • year = 2023,
    • editor = {Ishii, H. and Ebihara, Y. and Imura, J. and Yamakita, M.},
    • pages = {5500--5505},
    • month = jul,
    • publisher = {Elsevier},
    • doi = {10.1016/j.ifacol.2023.10.207},
    • url = {https://www.merl.com/publications/TR2023-088}
    • }
  •  Di Cairano, S., Skibik, T., Vinod, A.P., Weiss, A., Berntorp, K., "Decision Making for Automated Driving by Reachability of Parameterized Maneuvers", World Congress of the International Federation of Automatic Control (IFAC), Ishii, H., Ebihara, Y., Imura, J., Yamakita, M., Eds., DOI: 10.1016/j.ifacol.2023.10.018, July 2023, pp. 7852-7857.
    BibTeX TR2023-084 PDF
    • @inproceedings{DiCairano2023jul,
    • author = {{Di Cairano}, Stefano and Skibik, Terrence and Vinod, Abraham P. and Weiss, Avishai and Berntorp, Karl},
    • title = {{Decision Making for Automated Driving by Reachability of Parameterized Maneuvers}},
    • booktitle = {World Congress of the International Federation of Automatic Control (IFAC)},
    • year = 2023,
    • editor = {Ishii, H. and Ebihara, Y. and Imura, J. and Yamakita, M.},
    • pages = {7852--7857},
    • month = jul,
    • publisher = {Elsevier},
    • doi = {10.1016/j.ifacol.2023.10.018},
    • url = {https://www.merl.com/publications/TR2023-084}
    • }
  •  Salatiello, A., Wang, Y., Wichern, G., Koike-Akino, T., Yoshihiro, O., Kaneko, Y., Laughman, C.R., Chakrabarty, A., "Synthesizing Building Operation Data with Generative Models: VAEs, GANs, or Something In Between?", ACM e-Energy Conference, DOI: 10.1145/3599733.3600260, June 2023.
    BibTeX TR2023-072 PDF
    • @inproceedings{Salatiello2023jun,
    • author = {Salatiello, Alessandro and Wang, Ye and Wichern, Gordon and Koike-Akino, Toshiaki and Yoshihiro, Ohta and Kaneko, Yosuke and Laughman, Christopher R. and Chakrabarty, Ankush},
    • title = {{Synthesizing Building Operation Data with Generative Models: VAEs, GANs, or Something In Between?}},
    • booktitle = {ACM e-Energy Conference},
    • year = 2023,
    • month = jun,
    • doi = {10.1145/3599733.3600260},
    • url = {https://www.merl.com/publications/TR2023-072}
    • }
  •  Hu, H., Menner, M., Wang, Y., Fang, H., Sun, D., Takegami, T., "Simulator-based Mission Optimization for Conceptual Aircraft Design with Turboelectric Propulsion", AIAA/IEEE Electric Aircraft Technologies Symposium (EATS), DOI: 10.2514/6.2023-3872, June 2023, pp. 3872.
    BibTeX TR2023-069 PDF
    • @inproceedings{Hu2023jun,
    • author = {Hu, Hanyao and Menner, Marcel and Wang, Yebin and Fang, Huazhen and Sun, Dengfeng and Takegami, Tomoki},
    • title = {{Simulator-based Mission Optimization for Conceptual Aircraft Design with Turboelectric Propulsion}},
    • booktitle = {AIAA/IEEE Electric Aircraft Technologies Symposium (EATS)},
    • year = 2023,
    • pages = 3872,
    • month = jun,
    • doi = {10.2514/6.2023-3872},
    • url = {https://www.merl.com/publications/TR2023-069}
    • }
  •  Wu, S.-L., Chang, X., Wichern, G., Jung, J.-W., Germain, F.G., Le Roux, J., Watanabe, S., "BEATs-based Audio Captioning Model with Instructor Embedding Supervision and ChatGPT Mix-up," Tech. Rep. TR2023-068, DCASE2023 Challenge, May 2023.
    BibTeX TR2023-068 PDF
    • @techreport{Wu2023may,
    • author = {Wu, Shih-Lun and Chang, Xuankai and Wichern, Gordon and Jung, Jee-weon and Germain, François G and {Le Roux}, Jonathan and Watanabe, Shinji},
    • title = {{BEATs-based Audio Captioning Model with Instructor Embedding Supervision and ChatGPT Mix-up}},
    • institution = {DCASE2023 Challenge},
    • year = 2023,
    • month = may,
    • url = {https://www.merl.com/publications/TR2023-068}
    • }
  •  Ota, K., Tung, H.-Y., Smith, K., Cherian, A., Marks, T.K., Sullivan, A., Kanezaki, A., Tenenbaum, J.B., "H-SAUR: Hypothesize, Simulate, Act, Update, and Repeat for Understanding Object Articulations from Interactions", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA48891.2023.10160575, May 2023, pp. 7272-7278.
    BibTeX TR2023-009 PDF
    • @inproceedings{Ota2023may,
    • author = {Ota, Kei and Tung, Hsiao-Yu and Smith, Kevin and Cherian, Anoop and Marks, Tim K. and Sullivan, Alan and Kanezaki, Asako and Tenenbaum, Joshua B.},
    • title = {{H-SAUR: Hypothesize, Simulate, Act, Update, and Repeat for Understanding Object Articulations from Interactions}},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2023,
    • pages = {7272--7278},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICRA48891.2023.10160575},
    • url = {https://www.merl.com/publications/TR2023-009}
    • }
  •  Shirai, Y., Jha, D.K., Raghunathan, A., Hong, D., "Tactile Tool Manipulation", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA48891.2023.10160480, May 2023, pp. 12597-12603.
    BibTeX TR2023-023 PDF Video
    • @inproceedings{Shirai2023may2,
    • author = {Shirai, Yuki and Jha, Devesh K. and Raghunathan, Arvind and Hong, Dennis},
    • title = {{Tactile Tool Manipulation}},
    • booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
    • year = 2023,
    • pages = {12597--12603},
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICRA48891.2023.10160480},
    • isbn = {979-8-3503-2365-8},
    • url = {https://www.merl.com/publications/TR2023-023}
    • }
  •  Shirai, Y., Jha, D.K., Raghunathan, A., Hong, D., "Closed-Loop Tactile Controller for Tool Manipulation", ICRA 2023 Workshop on Embracing contacts. Making robots physically interact with our world, May 2023.
    BibTeX TR2023-043 PDF Video
    • @inproceedings{Shirai2023may,
    • author = {Shirai, Yuki and Jha, Devesh K. and Raghunathan, Arvind and Hong, Dennis},
    • title = {{Closed-Loop Tactile Controller for Tool Manipulation}},
    • booktitle = {ICRA 2023 Workshop on Embracing contacts. Making robots physically interact with our world},
    • year = 2023,
    • month = may,
    • url = {https://www.merl.com/publications/TR2023-043}
    • }
  •  Shah, A., Roy, A., Shah, K., Mishra, S.K., Jacobs, D., Cherian, A., Chellappa, R., "HaLP: Hallucinating Latent Positives for Skeleton-based Self-Supervised Learning of Actions", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), May 2023, pp. 18846-18856.
    BibTeX TR2023-035 PDF
    • @inproceedings{Shah2023may,
    • author = {Shah, Anshul and Roy, Aniket and Shah, Ketul and Mishra, Shlok Kumar and Jacobs, David and Cherian, Anoop and Chellappa, Rama},
    • title = {{HaLP: Hallucinating Latent Positives for Skeleton-based Self-Supervised Learning of Actions}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2023,
    • pages = {18846--18856},
    • month = may,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2023-035}
    • }
  •  Cherian, A., Peng, K.-C., Lohit, S., Smith, K., Tenenbaum, J.B., "Are Deep Neural Networks SMARTer than Second Graders?", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), March 2023, pp. 10834-10844.
    BibTeX TR2023-014 PDF Video Data Software Presentation
    • @inproceedings{Cherian2023mar,
    • author = {Cherian, Anoop and Peng, Kuan-Chuan and Lohit, Suhas and Smith, Kevin and Tenenbaum, Joshua B.},
    • title = {{Are Deep Neural Networks SMARTer than Second Graders?}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2023,
    • pages = {10834--10844},
    • month = mar,
    • publisher = {CVF},
    • url = {https://www.merl.com/publications/TR2023-014}
    • }