Publications

Karafiat, M., Baskar, M.K., Watanabe, S., Hori, T., Wiesner, M., Cernocky, J.H., "Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems", Interspeech, DOI: 10.21437/Interspeech.2019-2355, September 2019.
BibTeX TR2019-103 PDF
- @inproceedings{Karafiat2019sep,
- author = {Karafiat, Martin and Baskar, Murali Karthick and Watanabe, Shinji and Hori, Takaaki and Wiesner, Matthew and Cernocky, Jan Honza},
- title = {{Analysis of Multilingual Sequence-to-Sequence Speech Recognition Systems}},
- booktitle = {Interspeech},
- year = 2019,
- month = sep,
- doi = {10.21437/Interspeech.2019-2355},
- url = {https://www.merl.com/publications/TR2019-103}
- }
Zhang, S., Zhang, S., Wang, B., Habetler, T., "Deep Learning Algorithms for Bearing Fault Diagnostics — A Review", Symposium on Diagnostics for Electrical Machines, Power Electronics and Drives (SDEMPED), DOI: 10.1109/DEMPED.2019.8864915, August 2019, pp. 257-263.
BibTeX TR2019-084 PDF
- @inproceedings{Zhang2019aug,
- author = {Zhang, Shen and Zhang, Shibo and Wang, Bingnan and Habetler, Thomas},
- title = {{Deep Learning Algorithms for Bearing Fault Diagnostics --- A Review}},
- booktitle = {Symposium on Diagnostics for Electrical Machines, Power Electronics and Drives (SDEMPED)},
- year = 2019,
- pages = {257--263},
- month = aug,
- doi = {10.1109/DEMPED.2019.8864915},
- url = {https://www.merl.com/publications/TR2019-084}
- }
Wang, J., Cherian, A., "Discriminative Video Representation Learning Using Support Vector Classifiers", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2019.2937292, August 2019.
BibTeX TR2019-107 PDF
- @article{Wang2019aug,
-   author  = {Wang, Jue and Cherian, Anoop},
-   title   = {{Discriminative Video Representation Learning Using Support Vector Classifiers}},
-   journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
-   month   = aug,
-   year    = {2019},
-   doi     = {10.1109/TPAMI.2019.2937292},
-   url     = {https://www.merl.com/publications/TR2019-107},
- }
Li, Z., Chu, T., Kalabić, U., "Dynamics-Enabled Safe Deep Reinforcement Learning: Case Study on Active Suspension Control", IEEE Conference on Control Technology and Applications (CCTA), DOI: 10.1109/CCTA.2019.8920696, August 2019, pp. 585-591.
BibTeX TR2019-082 PDF
- @inproceedings{Li2019aug,
- author = {Li, Zhaojian and Chu, Tianshu and Kalabi{\'c}, Uro{\v{s}}},
- title = {{Dynamics-Enabled Safe Deep Reinforcement Learning: Case Study on Active Suspension Control}},
- booktitle = {IEEE Conference on Control Technology and Applications (CCTA)},
- year = 2019,
- pages = {585--591},
- month = aug,
- doi = {10.1109/CCTA.2019.8920696},
- url = {https://www.merl.com/publications/TR2019-082}
- }
Takahashi, T., Sun, H., Tian, D., Wang, Y., "Learning Heuristic Functions for Mobile Robot Path Planning Using Deep Neural Networks", International Conference on Automated Planning and Scheduling (ICAPS), July 2019, pp. 764-772.
BibTeX TR2019-072 PDF
- @inproceedings{Takahashi2019jul,
-   author    = {Takahashi, Takeshi and Sun, He and Tian, Dong and Wang, Yebin},
-   title     = {{Learning Heuristic Functions for Mobile Robot Path Planning Using Deep Neural Networks}},
-   booktitle = {International Conference on Automated Planning and Scheduling (ICAPS)},
-   publisher = {AAAI},
-   pages     = {764--772},
-   month     = jul,
-   year      = {2019},
-   url       = {https://www.merl.com/publications/TR2019-072},
- }
Lee, T.-Y., van Baar, J., Wittenburg, K.B., Sullivan, A., "Analysis of the contribution and temporal dependency of LSTM layers for reinforcement learning tasks", IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Explainable AI Workshop, June 2019, pp. 99-102.
BibTeX TR2019-049 PDF
- @inproceedings{Lee2019jun2,
- author = {Lee, Teng-Yok and {van Baar}, Jeroen and Wittenburg, Kent B. and Sullivan, Alan},
- title = {{Analysis of the contribution and temporal dependency of LSTM layers for reinforcement learning tasks}},
- booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Explainable AI Workshop},
- year = 2019,
- pages = {99--102},
- month = jun,
- url = {https://www.merl.com/publications/TR2019-049}
- }
Duan, C., Chen, S., Tian, D., Moura, J., Kovacevic, J., "Deep Graph Topology Learning for 3D Point Cloud Reconstruction", Graph Signal Processing Workshop (GSP), June 2019.
BibTeX TR2019-046 PDF
- @inproceedings{Duan2019jun,
-   author    = {Duan, Chaojing and Chen, Siheng and Tian, Dong and Moura, Jose and Kovacevic, Jelena},
-   title     = {{Deep Graph Topology Learning for 3D Point Cloud Reconstruction}},
-   booktitle = {Graph Signal Processing Workshop (GSP)},
-   month     = jun,
-   year      = {2019},
-   url       = {https://www.merl.com/publications/TR2019-046},
- }
Matsumine, T., Koike-Akino, T., Wang, Y., "Deep Learning-Based Constellation Optimization for Physical Network Coding in Two-Way Relay Networks", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC.2019.8761963, June 2019.
BibTeX TR2019-025 PDF
- @inproceedings{Matsumine2019jun,
-   author    = {Matsumine, Toshiki and Koike-Akino, Toshiaki and Wang, Ye},
-   title     = {{Deep Learning-Based Constellation Optimization for Physical Network Coding in Two-Way Relay Networks}},
-   booktitle = {IEEE International Conference on Communications (ICC)},
-   month     = jun,
-   year      = {2019},
-   doi       = {10.1109/ICC.2019.8761963},
-   issn      = {1938-1883},
-   isbn      = {978-1-5386-8088-9},
-   url       = {https://www.merl.com/publications/TR2019-025},
- }
van Baar, J., Sullivan, A., Corcodel, R., Jha, D.K., Romeres, D., Nikovski, D.N., "Sim-to-Real Transfer Learning using Robustified Controllers in Robotic Tasks involving Complex Dynamics", IEEE International Conference on Robotics and Automation (ICRA), DOI: 10.1109/ICRA.2019.8793561, May 2019, pp. 6001-6007.
BibTeX TR2018-202 PDF Video Software
- @inproceedings{vanBaar2019may,
-   author    = {{van Baar}, Jeroen and Sullivan, Alan and Corcodel, Radu and Jha, Devesh K. and Romeres, Diego and Nikovski, Daniel N.},
-   title     = {{Sim-to-Real Transfer Learning using Robustified Controllers in Robotic Tasks involving Complex Dynamics}},
-   booktitle = {IEEE International Conference on Robotics and Automation (ICRA)},
-   pages     = {6001--6007},
-   month     = may,
-   year      = {2019},
-   doi       = {10.1109/ICRA.2019.8793561},
-   url       = {https://www.merl.com/publications/TR2018-202},
- }
Aihara, R., Hanazawa, T., Okato, Y., Wichern, G., Le Roux, J., "Teacher-Student Deep Clustering For Low-Delay Single Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682695, May 2019.
BibTeX TR2019-003 PDF
- @inproceedings{Aihara2019may,
- author = {Aihara, Ryo and Hanazawa, Toshiyuki and Okato, Yohei and Wichern, Gordon and {Le Roux}, Jonathan},
- title = {{Teacher-Student Deep Clustering For Low-Delay Single Channel Speech Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8682695},
- url = {https://www.merl.com/publications/TR2019-003}
- }
Le Roux, J., Wichern, G., Watanabe, S., Sarroff, A., Hershey, J., "The Phasebook: Building Complex Masks via Discrete Representations for Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8682587, May 2019.
BibTeX TR2019-008 PDF
- @inproceedings{LeRoux2019may2,
-   author    = {{Le Roux}, Jonathan and Wichern, Gordon and Watanabe, Shinji and Sarroff, Andy and Hershey, John},
-   title     = {{The Phasebook: Building Complex Masks via Discrete Representations for Source Separation}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   month     = may,
-   year      = {2019},
-   doi       = {10.1109/ICASSP.2019.8682587},
-   url       = {https://www.merl.com/publications/TR2019-008},
- }
Lohit, S., Liu, D., Mansour, H., Boufounos, P.T., "Unrolled Projected Gradient Descent for Multi-Spectral Image Fusion", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683124, May 2019.
BibTeX TR2019-010 PDF
- @inproceedings{Lohit2019may,
-   author    = {Lohit, Suhas and Liu, Dehong and Mansour, Hassan and Boufounos, Petros T.},
-   title     = {{Unrolled Projected Gradient Descent for Multi-Spectral Image Fusion}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   month     = may,
-   year      = {2019},
-   doi       = {10.1109/ICASSP.2019.8683124},
-   url       = {https://www.merl.com/publications/TR2019-010},
- }
Seetharaman, P., Wichern, G., Le Roux, J., Pardo, B., "Bootstrapping Single-Channel Source Separation via Unsupervised Spatial Clustering on Stereo Mixtures", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683198, May 2019.
BibTeX TR2019-014 PDF
- @inproceedings{Seetharaman2019may2,
-   author    = {Seetharaman, Prem and Wichern, Gordon and {Le Roux}, Jonathan and Pardo, Bryan},
-   title     = {{Bootstrapping Single-Channel Source Separation via Unsupervised Spatial Clustering on Stereo Mixtures}},
-   booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
-   month     = may,
-   year      = {2019},
-   doi       = {10.1109/ICASSP.2019.8683198},
-   url       = {https://www.merl.com/publications/TR2019-014},
- }
Seetharaman, P., Wichern, G., Venkataramani, S., Le Roux, J., "Class-Conditional Embeddings for Music Source Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP.2019.8683007, May 2019.
BibTeX TR2019-004 PDF
- @inproceedings{Seetharaman2019may,
- author = {Seetharaman, Prem and Wichern, Gordon and Venkataramani, Shrikant and {Le Roux}, Jonathan},
- title = {{Class-Conditional Embeddings for Music Source Separation}},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2019,
- month = may,
- doi = {10.1109/ICASSP.2019.8683007},
- url = {https://www.merl.com/publications/TR2019-004}
- }
Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Adversarial Deep Learning in EEG Biometrics", IEEE Signal Processing Letters, DOI: 10.1109/LSP.2019.2906826, Vol. 26, No. 5, pp. 710-714, March 2019.
BibTeX TR2019-017 PDF
- @article{Ozdenizci2019mar2,
-   author  = {Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
-   title   = {{Adversarial Deep Learning in EEG Biometrics}},
-   journal = {IEEE Signal Processing Letters},
-   volume  = {26},
-   number  = {5},
-   pages   = {710--714},
-   month   = mar,
-   year    = {2019},
-   doi     = {10.1109/LSP.2019.2906826},
-   url     = {https://www.merl.com/publications/TR2019-017},
- }
Le Roux, J., Wichern, G., Watanabe, S., Sarroff, A., Hershey, J., "Phasebook and Friends: Leveraging discrete representations for source separation", IEEE Journal of Selected Topics in Signal Processing, DOI: 10.1109/JSTSP.2019.2904183, Vol. 13, No. 2, pp. 370-382, March 2019.
BibTeX TR2018-199 PDF
- @article{LeRoux2019mar,
-   author  = {{Le Roux}, Jonathan and Wichern, Gordon and Watanabe, Shinji and Sarroff, Andy and Hershey, John},
-   title   = {{Phasebook and Friends: Leveraging discrete representations for source separation}},
-   journal = {IEEE Journal of Selected Topics in Signal Processing},
-   volume  = {13},
-   number  = {2},
-   pages   = {370--382},
-   month   = mar,
-   year    = {2019},
-   doi     = {10.1109/JSTSP.2019.2904183},
-   url     = {https://www.merl.com/publications/TR2018-199},
- }
TaherSima, M., Kojima, K., Koike-Akino, T., Jha, D., Wang, B., Lin, C., Parsons, K., "Deep Neural Network Inverse Design of Integrated Photonic Power Splitters", Scientific Reports, DOI: 10.1038/s41598-018-37952-2, Vol. 9, pp. 1368, December 2018.
BibTeX TR2018-180 PDF
- @article{TaherSima2018dec,
- author = {TaherSima, Mohammad and Kojima, Keisuke and Koike-Akino, Toshiaki and Jha, Devesh and Wang, Bingnan and Lin, Chungwei and Parsons, Kieran},
- title = {{Deep Neural Network Inverse Design of Integrated Photonic Power Splitters}},
- journal = {Scientific Reports},
- year = 2018,
- volume = 9,
- pages = {1368},
- month = dec,
- doi = {10.1038/s41598-018-37952-2},
- issn = {2045-2322},
- url = {https://www.merl.com/publications/TR2018-180}
- }
Paul, S., van Baar, J., "Trajectory-based Learning for Ball-in-Maze Games", NIPS Workshop on Imitation Learning and its Challenges in Robotics, December 2018.
BibTeX TR2018-158 PDF
- @inproceedings{Paul2018dec,
-   author    = {Paul, Sujoy and {van Baar}, Jeroen},
-   title     = {{Trajectory-based Learning for Ball-in-Maze Games}},
-   booktitle = {NIPS Workshop on Imitation Learning and its Challenges in Robotics},
-   month     = dec,
-   year      = {2018},
-   url       = {https://www.merl.com/publications/TR2018-158},
- }
Jha, D.K., Romeres, D., van Baar, J., Sullivan, A., Nikovski, D.N., "Learning Tasks in a Complex Circular Maze Environment", NIPS Workshop on Modeling the Physical World: Perception, Learning, and Control, December 2018.
BibTeX TR2018-169 PDF
- @inproceedings{vanBaar2018dec,
-   author    = {Jha, Devesh K. and Romeres, Diego and {van Baar}, Jeroen and Sullivan, Alan and Nikovski, Daniel N.},
-   title     = {{Learning Tasks in a Complex Circular Maze Environment}},
-   booktitle = {NIPS Workshop on Modeling the Physical World: Perception, Learning, and Control},
-   month     = dec,
-   year      = {2018},
-   url       = {https://www.merl.com/publications/TR2018-169},
- }
Wichern, G., Le Roux, J., "Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation", International Workshop on Acoustic Signal Enhancement (IWAENC), DOI: 10.1109/IWAENC.2018.8521243, September 2018.
BibTeX TR2018-146 PDF
- @inproceedings{Wichern2018sep,
-   author    = {Wichern, Gordon and {Le Roux}, Jonathan},
-   title     = {{Phase Reconstruction with Learned Time-Frequency Representations for Single-Channel Speech Separation}},
-   booktitle = {International Workshop on Acoustic Signal Enhancement (IWAENC)},
-   month     = sep,
-   year      = {2018},
-   doi       = {10.1109/IWAENC.2018.8521243},
-   url       = {https://www.merl.com/publications/TR2018-146},
- }
Wang, J., Cherian, A., "Learning Discriminative Video Representations Using Adversarial Perturbations", European Conference on Computer Vision (ECCV), September 2018.
BibTeX TR2018-139 PDF Software
- @inproceedings{Wang2018sep3,
-   author    = {Wang, Jue and Cherian, Anoop},
-   title     = {{Learning Discriminative Video Representations Using Adversarial Perturbations}},
-   booktitle = {European Conference on Computer Vision (ECCV)},
-   month     = sep,
-   year      = {2018},
-   url       = {https://www.merl.com/publications/TR2018-139},
- }
Kocanaogullari, A., Ataer-Cansizoglu, E., "Active Descriptor Learning for Feature Matching", International Workshop on Compact and Efficient Feature Representation and Learning in Computer Vision, September 2018.
BibTeX TR2018-132 PDF
- @inproceedings{Kocanaogullari2018sep,
-   author    = {Kocanaogullari, Aziz and Ataer-Cansizoglu, Esra},
-   title     = {{Active Descriptor Learning for Feature Matching}},
-   booktitle = {International Workshop on Compact and Efficient Feature Representation and Learning in Computer Vision},
-   month     = sep,
-   year      = {2018},
-   url       = {https://www.merl.com/publications/TR2018-132},
- }
Wang, Z.-Q., Le Roux, J., Wang, D., Hershey, J., "End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction", Interspeech, September 2018.
BibTeX TR2018-135 PDF
- @inproceedings{Wang2018sep,
-   author    = {Wang, Zhong-Qiu and {Le Roux}, Jonathan and Wang, DeLiang and Hershey, John},
-   title     = {{End-to-End Speech Separation with Unfolded Iterative Phase Reconstruction}},
-   booktitle = {Interspeech},
-   month     = sep,
-   year      = {2018},
-   url       = {https://www.merl.com/publications/TR2018-135},
- }
Watanabe, S., Hori, T., Karita, S., Hayashi, T., Nishitoba, J., Unno, Y., Enrique Yalta Soplin, N., Heymann, J., Wiesner, M., Chen, N., Renduchintala, A., Ochiai, T., "ESPnet: End-to-End Speech Processing Toolkit", Interspeech, September 2018.
BibTeX TR2018-136 PDF
- @inproceedings{Watanabe2018sep,
-   author    = {Watanabe, Shinji and Hori, Takaaki and Karita, Shigeki and Hayashi, Tomoki and Nishitoba, Jiro and Unno, Yuya and Enrique Yalta Soplin, Nelson and Heymann, Jahn and Wiesner, Matthew and Chen, Nanxin and Renduchintala, Adithya and Ochiai, Tsubasa},
-   title     = {{ESPnet: End-to-End Speech Processing Toolkit}},
-   booktitle = {Interspeech},
-   month     = sep,
-   year      = {2018},
-   url       = {https://www.merl.com/publications/TR2018-136},
- }
Ataer-Cansizoglu, E., Jones, M.J., Zhang, Z., Sullivan, A., "Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network", arXiv, August 2018.
BibTeX arXiv
- @article{Ataer-Cansizoglu2018aug,
- author = {Ataer-Cansizoglu, Esra and Jones, Michael J. and Zhang, Ziming and Sullivan, Alan},
- title = {{Verification of Very Low-Resolution Faces Using An Identity-Preserving Deep Face Super-resolution Network}},
- journal = {arXiv},
- year = 2018,
- month = aug,
- eprint = {1903.10974},
- archiveprefix = {arXiv},
- url = {https://arxiv.org/abs/1903.10974}
- }