Publications

661 / 3,813 publications found.


  •  Cherian, A., Chatterjee, M., Ahuja, N., "Sound2Sight: Generating Visual Dynamics from Sound and Context", European Conference on Computer Vision (ECCV), Vedaldi, A. and Bischof, H. and Brox, Th. and Frahm, J.-M., Eds., August 2020.
    BibTeX TR2020-121 PDF Software
    • @inproceedings{Cherian2020aug,
    • author = {Cherian, Anoop and Chatterjee, Moitreya and Ahuja, Narendra},
    • title = {{Sound2Sight: Generating Visual Dynamics from Sound and Context}},
    • booktitle = {European Conference on Computer Vision (ECCV)},
    • year = 2020,
    • editor = {Vedaldi, A. and Bischof, H. and Brox, Th. and Frahm, J.-M.},
    • month = aug,
    • publisher = {Springer},
    • url = {https://www.merl.com/publications/TR2020-121}
    • }
  •  Han, M., Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Disentangled Adversarial Transfer Learning for Physiological Biosignals", International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC), DOI: 10.1109/EMBC44109.2020.9175233, July 2020.
    BibTeX TR2020-109 PDF Video Presentation
    • @inproceedings{Han2020jul,
    • author = {Han, Mo and Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
    • title = {{Disentangled Adversarial Transfer Learning for Physiological Biosignals}},
    • booktitle = {International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)},
    • year = 2020,
    • month = jul,
    • publisher = {IEEE},
    • doi = {10.1109/EMBC44109.2020.9175233},
    • issn = {1558-4615},
    • isbn = {978-1-7281-1990-8},
    • url = {https://www.merl.com/publications/TR2020-109}
    • }
  •  Seetharaman, P., Wichern, G., Le Roux, J., Pardo, B., "Bootstrapping Unsupervised Deep Music Separation from Primitive Auditory Grouping Principles", ICML 2020 Workshop on Self-supervision in Audio and Speech, July 2020.
    BibTeX TR2020-111 PDF
    • @inproceedings{Seetharaman2020jul,
    • author = {Seetharaman, Prem and Wichern, Gordon and {Le Roux}, Jonathan and Pardo, Bryan},
    • title = {{Bootstrapping Unsupervised Deep Music Separation from Primitive Auditory Grouping Principles}},
    • booktitle = {ICML 2020 Workshop on Self-supervision in Audio and Speech},
    • year = 2020,
    • month = jul,
    • url = {https://www.merl.com/publications/TR2020-111}
    • }
  •  Cherian, A., Aeron, S., "Representation Learning via Adversarially-Contrastive Optimal Transport", International Conference on Machine Learning (ICML), Daumé, H. and Singh, A., Eds., July 2020, pp. 10675-10685.
    BibTeX TR2020-093 PDF Software
    • @inproceedings{Cherian2020jul,
    • author = {Cherian, Anoop and Aeron, Shuchin},
    • title = {{Representation Learning via Adversarially-Contrastive Optimal Transport}},
    • booktitle = {International Conference on Machine Learning (ICML)},
    • year = 2020,
    • editor = {Daumé, H. and Singh, A.},
    • pages = {10675--10685},
    • month = jul,
    • url = {https://www.merl.com/publications/TR2020-093}
    • }
  •  Koike-Akino, T., Wang, Y., "Stochastic Bottleneck: Rateless Auto-Encoder for Flexible Dimensionality Reduction", IEEE International Symposium on Information Theory (ISIT), DOI: 10.1109/ISIT44484.2020.9174523, June 2020.
    BibTeX TR2020-075 PDF Video Presentation
    • @inproceedings{Koike-Akino2020jun,
    • author = {Koike-Akino, Toshiaki and Wang, Ye},
    • title = {{Stochastic Bottleneck: Rateless Auto-Encoder for Flexible Dimensionality Reduction}},
    • booktitle = {IEEE International Symposium on Information Theory (ISIT)},
    • year = 2020,
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.1109/ISIT44484.2020.9174523},
    • issn = {2157-8117},
    • isbn = {978-1-7281-6432-8},
    • url = {https://www.merl.com/publications/TR2020-075}
    • }
  •  Hu, Y., Chen, S., Zhang, Y., Gu, X., "Collaborative Motion Prediction via Neural Motion Message Passing", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.00635, June 2020, pp. 6318-6327.
    BibTeX TR2020-072 PDF
    • @inproceedings{Hu2020jun,
    • author = {Hu, Yue and Chen, Siheng and Zhang, Ya and Gu, Xiao},
    • title = {{Collaborative Motion Prediction via Neural Motion Message Passing}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2020,
    • pages = {6318--6327},
    • month = jun,
    • doi = {10.1109/CVPR42600.2020.00635},
    • url = {https://www.merl.com/publications/TR2020-072}
    • }
  •  Li, M., Chen, S., Zhao, Y., Zhang, Y., Wang, Y., Tian, Q., "Dynamic Multiscale Graph Neural Networks for 3D Skeleton-Based Human Motion Prediction", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.00029, June 2020, pp. 211-220.
    BibTeX TR2020-073 PDF
    • @inproceedings{Li2020jun,
    • author = {Li, Maosen and Chen, Siheng and Zhao, Yangheng and Zhang, Ya and Wang, Yanfeng and Tian, Qi},
    • title = {{Dynamic Multiscale Graph Neural Networks for 3D Skeleton-Based Human Motion Prediction}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2020,
    • pages = {211--220},
    • month = jun,
    • doi = {10.1109/CVPR42600.2020.00029},
    • url = {https://www.merl.com/publications/TR2020-073}
    • }
  •  Wang, Y., Koike-Akino, T., "Learning to Modulate for Non-coherent MIMO", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC40277.2020.9149438, June 2020.
    BibTeX TR2020-071 PDF Video Presentation
    • @inproceedings{Wang2020jun,
    • author = {Wang, Ye and Koike-Akino, Toshiaki},
    • title = {{Learning to Modulate for Non-coherent MIMO}},
    • booktitle = {IEEE International Conference on Communications (ICC)},
    • year = 2020,
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.1109/ICC40277.2020.9149438},
    • issn = {1938-1883},
    • isbn = {978-1-7281-5089-5},
    • url = {https://www.merl.com/publications/TR2020-071}
    • }
  •  Kumar, A., Marks, T.K., Mou, W., Wang, Y., Cherian, A., Jones, M.J., Liu, X., Koike-Akino, T., Feng, C., "LUVLi Face Alignment: Estimating Landmarks’ Location, Uncertainty, and Visibility Likelihood", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.00826, June 2020.
    BibTeX TR2020-067 PDF Video Data Software
    • @inproceedings{Kumar2020jun,
    • author = {Kumar, Abhinav and Marks, Tim K. and Mou, Wenxuan and Wang, Ye and Cherian, Anoop and Jones, Michael J. and Liu, Xiaoming and Koike-Akino, Toshiaki and Feng, Chen},
    • title = {{LUVLi Face Alignment: Estimating Landmarks’ Location, Uncertainty, and Visibility Likelihood}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2020,
    • month = jun,
    • publisher = {IEEE},
    • doi = {10.1109/CVPR42600.2020.00826},
    • issn = {2575-7075},
    • isbn = {978-1-7281-7168-5},
    • url = {https://www.merl.com/publications/TR2020-067}
    • }
  •  Wu, P., Chen, S., "MotionNet: Joint Perception and Motion Prediction for Autonomous Driving Based on Bird’s Eye View Maps", IEEE Conference on Computer Vision and Pattern Recognition (CVPR), DOI: 10.1109/CVPR42600.2020.01140, June 2020, pp. 11382-11392.
    BibTeX TR2020-068 PDF Data Software
    • @inproceedings{Wu2020jun,
    • author = {Wu, Pengxiang and Chen, Siheng},
    • title = {{MotionNet: Joint Perception and Motion Prediction for Autonomous Driving Based on Bird’s Eye View Maps}},
    • booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
    • year = 2020,
    • pages = {11382--11392},
    • month = jun,
    • doi = {10.1109/CVPR42600.2020.01140},
    • url = {https://www.merl.com/publications/TR2020-068}
    • }
  •  Chen, S., Liu, B., Feng, C., Vallespi-Gonzalez, C., Wellington, C., "3D Point Cloud Processing and Learning for Autonomous Driving", IEEE Signal Processing Magazine, DOI: 10.1109/MSP.2020.2984780, Vol. 38, No. 1, pp. 68-86, May 2020.
    BibTeX TR2020-066 PDF
    • @article{Chen2020may2,
    • author = {Chen, Siheng and Liu, Baoan and Feng, Chen and Vallespi-Gonzalez, Carlos and Wellington, Carl},
    • title = {{3D Point Cloud Processing and Learning for Autonomous Driving}},
    • journal = {IEEE Signal Processing Magazine},
    • year = 2020,
    • volume = 38,
    • number = 1,
    • pages = {68--86},
    • month = may,
    • doi = {10.1109/MSP.2020.2984780},
    • url = {https://www.merl.com/publications/TR2020-066}
    • }
  •  Fujihashi, T., Koike-Akino, T., Watanabe, T., Orlik, P.V., "High-Quality Soft Image Delivery with Deep Image Denoising", IEEE International Conference on Communications (ICC), DOI: 10.1109/ICC40277.2020.9148611, May 2020.
    BibTeX TR2020-060 PDF Video
    • @inproceedings{Fujihashi2020may,
    • author = {Fujihashi, Takuya and Koike-Akino, Toshiaki and Watanabe, Takashi and Orlik, Philip V.},
    • title = {{High-Quality Soft Image Delivery with Deep Image Denoising}},
    • booktitle = {IEEE International Conference on Communications (ICC)},
    • year = 2020,
    • month = may,
    • publisher = {IEEE},
    • doi = {10.1109/ICC40277.2020.9148611},
    • issn = {1938-1883},
    • isbn = {978-1-7281-5089-5},
    • url = {https://www.merl.com/publications/TR2020-060}
    • }
  •  Bhamidipati, S., Kim, K.J., Sun, H., Orlik, P.V., "Artificial Intelligence-Based Distributed Belief Propagation and Recurrent Neural Network Algorithm for Wide-Area Monitoring Systems", IEEE Network, DOI: 10.1109/MNET.011.1900322, Vol. 34, No. 3, pp. 64-72, May 2020.
    BibTeX TR2020-058 PDF
    • @article{Bhamidipati2020may,
    • author = {Bhamidipati, Sriramya and Kim, Kyeong Jin and Sun, Hongbo and Orlik, Philip V.},
    • title = {{Artificial Intelligence-Based Distributed Belief Propagation and Recurrent Neural Network Algorithm for Wide-Area Monitoring Systems}},
    • journal = {IEEE Network},
    • year = 2020,
    • volume = 34,
    • number = 3,
    • pages = {64--72},
    • month = may,
    • doi = {10.1109/MNET.011.1900322},
    • url = {https://www.merl.com/publications/TR2020-058}
    • }
  •  Ozdenizci, O., Wang, Y., Koike-Akino, T., Erdogmus, D., "Learning Invariant Representations from EEG via Adversarial Inference", IEEE Access, DOI: 10.1109/ACCESS.2020.2971600, Vol. 8, pp. 27074-27085, April 2020.
    BibTeX TR2020-049 PDF
    • @article{Ozdenizci2020apr,
    • author = {Ozdenizci, Ozan and Wang, Ye and Koike-Akino, Toshiaki and Erdogmus, Deniz},
    • title = {{Learning Invariant Representations from EEG via Adversarial Inference}},
    • journal = {IEEE Access},
    • year = 2020,
    • volume = 8,
    • pages = {27074--27085},
    • month = apr,
    • doi = {10.1109/ACCESS.2020.2971600},
    • issn = {2169-3536},
    • url = {https://www.merl.com/publications/TR2020-049}
    • }
  •  Chang, X., Zhang, W., Qian, Y., Le Roux, J., Watanabe, S., "End-To-End Multi-Speaker Speech Recognition with Transformer", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054029, April 2020, pp. 6134-6138.
    BibTeX TR2020-043 PDF Video Presentation
    • @inproceedings{Chang2020apr,
    • author = {Chang, Xuankai and Zhang, Wangyou and Qian, Yanmin and {Le Roux}, Jonathan and Watanabe, Shinji},
    • title = {{End-To-End Multi-Speaker Speech Recognition with Transformer}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {6134--6138},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9054029},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-043}
    • }
  •  Pishdadian, F., Wichern, G., Le Roux, J., "Learning to Separate Sounds From Weakly Labeled Scenes", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053055, April 2020, pp. 91-95.
    BibTeX TR2020-038 PDF Video Presentation
    • @inproceedings{Pishdadian2020apr,
    • author = {Pishdadian, Fatemeh and Wichern, Gordon and {Le Roux}, Jonathan},
    • title = {{Learning to Separate Sounds From Weakly Labeled Scenes}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {91--95},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9053055},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-038}
    • }
  •  Al-Shabili, A., Mansour, H., Boufounos, P.T., "Learning Plug-and-Play Proximal Quasi-Newton Denoisers", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054537, April 2020, pp. 8896-8900.
    BibTeX TR2020-045 PDF Video
    • @inproceedings{Al-Shabili2020apr,
    • author = {Al-Shabili, Abdullah and Mansour, Hassan and Boufounos, Petros T.},
    • title = {{Learning Plug-and-Play Proximal Quasi-Newton Denoisers}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {8896--8900},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9054537},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-045}
    • }
  •  Maciejewski, M., Wichern, G., McQuinn, E., Le Roux, J., "WHAMR!: Noisy and Reverberant Single-Channel Speech Separation", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053327, April 2020, pp. 696-700.
    BibTeX TR2020-042 PDF Video Presentation
    • @inproceedings{Maciejewski2020apr,
    • author = {Maciejewski, Matthew and Wichern, Gordon and McQuinn, Emmett and {Le Roux}, Jonathan},
    • title = {{WHAMR!: Noisy and Reverberant Single-Channel Speech Separation}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {696--700},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9053327},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-042}
    • }
  •  Moritz, N., Hori, T., Le Roux, J., "Streaming Automatic Speech Recognition With The Transformer Model", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054476, April 2020, pp. 6074-6078.
    BibTeX TR2020-040 PDF Video Presentation
    • @inproceedings{Moritz2020apr,
    • author = {Moritz, Niko and Hori, Takaaki and {Le Roux}, Jonathan},
    • title = {{Streaming Automatic Speech Recognition With The Transformer Model}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {6074--6078},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9054476},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-040}
    • }
  •  Sari, L., Moritz, N., Hori, T., Le Roux, J., "Unsupervised Speaker Adaptation Using Attention-Based Speaker Memory For End-To-End ASR", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9054249, April 2020, pp. 7384-7388.
    BibTeX TR2020-037 PDF Video Presentation
    • @inproceedings{Sari2020apr,
    • author = {Sari, Leda and Moritz, Niko and Hori, Takaaki and {Le Roux}, Jonathan},
    • title = {{Unsupervised Speaker Adaptation Using Attention-Based Speaker Memory For End-To-End ASR}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {7384--7388},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9054249},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-037}
    • }
  •  Shi, L., Geng, S., Shuang, K., Hori, C., Liu, S., Gao, P., Su, S., "Multi-Layer Content Interaction Through Quaternion Product For Visual Question Answering", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP40776.2020.9053595, April 2020, pp. 4412-4416.
    BibTeX TR2020-046 PDF
    • @inproceedings{Shi2020apr,
    • author = {Shi, Lei and Geng, Shijie and Shuang, Kai and Hori, Chiori and Liu, Songxiang and Gao, Peng and Su, Sen},
    • title = {{Multi-Layer Content Interaction Through Quaternion Product For Visual Question Answering}},
    • booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
    • year = 2020,
    • pages = {4412--4416},
    • month = apr,
    • publisher = {IEEE},
    • doi = {10.1109/ICASSP40776.2020.9053595},
    • issn = {2379-190X},
    • isbn = {978-1-5090-6631-5},
    • url = {https://www.merl.com/publications/TR2020-046}
    • }
  •  Li, R., Wang, X., Mallidi, H., Watanabe, S., Hori, T., Hermansky, H., "Multi-Stream End-to-End Speech Recognition", IEEE/ACM Transactions on Audio, Speech and Language Processing, DOI: 10.1109/TASLP.2019.2959721, Vol. 28, pp. 646-655, March 2020.
    BibTeX TR2020-030 PDF
    • @article{Li2020mar,
    • author = {Li, Ruizhi and Wang, Xiaofei and Mallidi, Harish and Watanabe, Shinji and Hori, Takaaki and Hermansky, Hynek},
    • title = {{Multi-Stream End-to-End Speech Recognition}},
    • journal = {IEEE/ACM Transactions on Audio, Speech and Language Processing},
    • year = 2020,
    • volume = 28,
    • pages = {646--655},
    • month = mar,
    • doi = {10.1109/TASLP.2019.2959721},
    • url = {https://www.merl.com/publications/TR2020-030}
    • }
  •  D’Haro, L.F., Yoshino, K., Hori, C., Marks, T.K., Polymenakos, L., Kummerfeld, J.K., Galley, M., Gao, X., "Overview of the seventh Dialog System Technology Challenge: DSTC7", Computer Speech and Language, DOI: 10.1016/j.csl.2020.101068, Vol. 62, March 2020.
    BibTeX TR2020-029 PDF
    • @article{D’Haro2020mar,
    • author = {D’Haro, Luis Fernando and Yoshino, Koichiro and Hori, Chiori and Marks, Tim K. and Polymenakos, Lazaros and Kummerfeld, Jonathan K. and Galley, Michel and Gao, Xiang},
    • title = {{Overview of the seventh Dialog System Technology Challenge: DSTC7}},
    • journal = {Computer Speech and Language},
    • year = 2020,
    • volume = 62,
    • month = mar,
    • doi = {10.1016/j.csl.2020.101068},
    • url = {https://www.merl.com/publications/TR2020-029}
    • }
  •  Kojima, K., TaherSima, M., Koike-Akino, T., Jha, D.K., Tang, Y., Parsons, K., Sang, F., Klamkin, J., "Deep Neural Networks for Designing Integrated Photonics", Optical Fiber Communication Conference and Exposition (OFC), DOI: 10.1364/OFC.2020.Th1A.6, March 2020.
    BibTeX TR2020-057 PDF
    • @inproceedings{Kojima2020mar,
    • author = {Kojima, Keisuke and TaherSima, Mohammad and Koike-Akino, Toshiaki and Jha, Devesh K. and Tang, Yingheng and Parsons, Kieran and Sang, Fengqiao and Klamkin, Jonathan},
    • title = {{Deep Neural Networks for Designing Integrated Photonics}},
    • booktitle = {Optical Fiber Communication Conference and Exposition (OFC)},
    • year = 2020,
    • month = mar,
    • publisher = {OSA},
    • doi = {10.1364/OFC.2020.Th1A.6},
    • isbn = {978-1-943580-71-2},
    • url = {https://www.merl.com/publications/TR2020-057}
    • }
  •  Tang, Y., Kojima, K., Koike-Akino, T., Wang, Y., Wu, P., TaherSima, M., Jha, D.K., Parsons, K., Qi, M., "Generative Deep Learning Model for a Multi-level NanoOptic Broadband Power Splitter", Optical Fiber Communication Conference and Exposition (OFC), DOI: 10.1364/OFC.2020.Th1A.1, March 2020, pp. Th1A.1.
    BibTeX TR2020-025 PDF
    • @inproceedings{Tang2020mar,
    • author = {Tang, Yingheng and Kojima, Keisuke and Koike-Akino, Toshiaki and Wang, Ye and Wu, Pengxiang and TaherSima, Mohammad and Jha, Devesh K. and Parsons, Kieran and Qi, Minghao},
    • title = {{Generative Deep Learning Model for a Multi-level NanoOptic Broadband Power Splitter}},
    • booktitle = {Optical Fiber Communication Conference and Exposition (OFC)},
    • year = 2020,
    • pages = {Th1A.1},
    • month = mar,
    • publisher = {OSA},
    • doi = {10.1364/OFC.2020.Th1A.1},
    • isbn = {978-1-943580-71-2},
    • url = {https://www.merl.com/publications/TR2020-025}
    • }