- Higuchi, Y., Moritz, N., Le Roux, J., Hori, T., "Momentum Pseudo-Labeling for Semi-Supervised Speech Recognition", Interspeech, DOI: 10.21437/Interspeech.2021-571, September 2021, pp. 726-730.
BibTeX TR2021-103 PDF- @inproceedings{Higuchi2021sep,
- author = {Higuchi, Yosuke and Moritz, Niko and Le Roux, Jonathan and Hori, Takaaki},
- title = {Momentum Pseudo-Labeling for Semi-Supervised Speech Recognition},
- booktitle = {Interspeech},
- year = 2021,
- pages = {726--730},
- month = sep,
- doi = {10.21437/Interspeech.2021-571},
- url = {https://www.merl.com/publications/TR2021-103}
- }
- Liu, B., Guo, J., Koike-Akino, T., Wang, Y., Kim, K.J., Parsons, K., Orlik, P.V., Hashimoto, S., Yuan, J., "Anomaly Detection and Diagnosis Using Pre-Processing and Time-Delay Autoencoder", IEEE International Conference on Emerging Technologies and Factory Automation, September 2021.
BibTeX TR2021-107 PDF- @inproceedings{Liu2021sep,
- author = {Liu, Bryan and Guo, Jianlin and Koike-Akino, Toshiaki and Wang, Ye and Kim, Kyeong Jin and Parsons, Kieran and Orlik, Philip V. and Hashimoto, Shigeru and Yuan, Jinhong},
- title = {Anomaly Detection and Diagnosis Using Pre-Processing and Time-Delay Autoencoder},
- booktitle = {IEEE International Conference on Emerging Technologies and Factory Automation},
- year = 2021,
- month = sep,
- url = {https://www.merl.com/publications/TR2021-107}
- }
- Hori, T., Moritz, N., Hori, C., Le Roux, J., "Advanced Long-context End-to-end Speech Recognition Using Context-expanded Transformers", Interspeech, DOI: 10.21437/Interspeech.2021-1643, August 2021, pp. 2097-2101.
BibTeX TR2021-100 PDF- @inproceedings{Hori2021aug3,
- author = {Hori, Takaaki and Moritz, Niko and Hori, Chiori and Le Roux, Jonathan},
- title = {Advanced Long-context End-to-end Speech Recognition Using Context-expanded Transformers},
- booktitle = {Interspeech},
- year = 2021,
- pages = {2097--2101},
- month = aug,
- doi = {10.21437/Interspeech.2021-1643},
- url = {https://www.merl.com/publications/TR2021-100}
- }
- Hori, C., Hori, T., Le Roux, J., "Optimizing Latency for Online Video Captioning Using Audio-Visual Transformers", Interspeech, DOI: 10.21437/Interspeech.2021-1975, August 2021, pp. 586-590.
BibTeX TR2021-093 PDF- @inproceedings{Hori2021aug2,
- author = {Hori, Chiori and Hori, Takaaki and Le Roux, Jonathan},
- title = {Optimizing Latency for Online Video Captioning Using Audio-Visual Transformers},
- booktitle = {Interspeech},
- year = 2021,
- pages = {586--590},
- month = aug,
- publisher = {ISCA},
- doi = {10.21437/Interspeech.2021-1975},
- url = {https://www.merl.com/publications/TR2021-093}
- }
- Moritz, N., Hori, T., Le Roux, J., "Dual Causal/Non-Causal Self-Attention for Streaming End-to-End Speech Recognition", Interspeech, DOI: 10.21437/Interspeech.2021-1693, August 2021, pp. 1822-1826.
BibTeX TR2021-094 PDF- @inproceedings{Moritz2021aug,
- author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
- title = {Dual Causal/Non-Causal Self-Attention for Streaming End-to-End Speech Recognition},
- booktitle = {Interspeech},
- year = 2021,
- pages = {1822--1826},
- month = aug,
- doi = {10.21437/Interspeech.2021-1693},
- url = {https://www.merl.com/publications/TR2021-094}
- }
- Kojima, K., Koike-Akino, T., Tang, Y., Wang, Y., "Inverse design for integrated photonics using deep neural network", Integrated Photonics Research, Silicon and Nanophotonics (IPR), DOI: 10.1364/IPRSN.2021.IF3A.6, July 2021.
BibTeX TR2021-061 PDF- @inproceedings{Kojima2021jul,
- author = {Kojima, Keisuke and Koike-Akino, Toshiaki and Tang, Yingheng and Wang, Ye},
- title = {Inverse design for integrated photonics using deep neural network},
- booktitle = {Integrated Photonics Research, Silicon and Nanophotonics (IPR)},
- year = 2021,
- month = jul,
- doi = {10.1364/IPRSN.2021.IF3A.6},
- url = {https://www.merl.com/publications/TR2021-061}
- }
- Wang, Y., Aeron, S., Rakin, A.S., Koike-Akino, T., Moulin, P., "Robust Machine Learning via Privacy/Rate-Distortion Theory", IEEE International Symposium on Information Theory (ISIT), DOI: 10.1109/ISIT45174.2021.9517751, July 2021.
BibTeX TR2021-082 PDF Video Presentation- @inproceedings{Wang2021jul,
- author = {Wang, Ye and Aeron, Shuchin and Rakin, Adnan S. and Koike-Akino, Toshiaki and Moulin, Pierre},
- title = {Robust Machine Learning via Privacy/Rate-Distortion Theory},
- booktitle = {IEEE International Symposium on Information Theory (ISIT)},
- year = 2021,
- month = jul,
- publisher = {IEEE},
- doi = {10.1109/ISIT45174.2021.9517751},
- isbn = {978-1-5386-8210-4},
- url = {https://www.merl.com/publications/TR2021-082}
- }
- Cherian, A., Wang, J., "Generalized One-Class Learning Using Pairs of Complementary Classifiers", IEEE Transactions on Pattern Analysis and Machine Intelligence, DOI: 10.1109/TPAMI.2021.3092999, June 2021.
BibTeX TR2021-076 PDF Software- @article{Cherian2021jun,
- author = {Cherian, Anoop and Wang, Jue},
- title = {Generalized One-Class Learning Using Pairs of Complementary Classifiers},
- journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
- year = 2021,
- month = jun,
- doi = {10.1109/TPAMI.2021.3092999},
- url = {https://www.merl.com/publications/TR2021-076}
- }
- Hori, C., "Human Perspective Scene Understanding via Multimodal Sensing," Tech. Rep. TR2022-151, Audio-Visual Scene Understanding Tutorial at CVPR 2021, June 2021.
BibTeX TR2022-151 PDF Video- @techreport{Hori2021jun,
- author = {Hori, Chiori},
- title = {Human Perspective Scene Understanding via Multimodal Sensing},
- institution = {Mitsubishi Electric Research Laboratories},
- year = 2021,
- month = jun,
- url = {https://www.merl.com/publications/TR2022-151}
- }
- Raychaudhuri, D.S., van Baar, J., Paul, S., Roy-Chowdhury, A.K., "Cross-domain Imitation from Observations", International Conference on Machine Learning (ICML), June 2021.
BibTeX TR2021-074 PDF- @inproceedings{Raychaudhuri2021jun,
- author = {Raychaudhuri, Dripta S. and van Baar, Jeroen and Paul, Sujoy and Roy-Chowdhury, Amit K.},
- title = {Cross-domain Imitation from Observations},
- booktitle = {International Conference on Machine Learning (ICML)},
- year = 2021,
- month = jun,
- url = {https://www.merl.com/publications/TR2021-074}
- }
- Moritz, N., Hori, T., Le Roux, J., "Capturing Multi-Resolution Context by Dilated Self-Attention", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9415001, June 2021, pp. 5869-5873.
BibTeX TR2021-036 PDF- @inproceedings{Moritz2021jun,
- author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
- title = {Capturing Multi-Resolution Context by Dilated Self-Attention},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2021,
- pages = {5869--5873},
- month = jun,
- doi = {10.1109/ICASSP39728.2021.9415001},
- url = {https://www.merl.com/publications/TR2021-036}
- }
- Chen, S., Eldar, Y., "Time-Varying Graph Signal Inpainting via Unrolling Networks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9413406, June 2021.
BibTeX TR2021-070 PDF- @inproceedings{Chen2021jun,
- author = {Chen, Siheng and Eldar, Yonina},
- title = {Time-Varying Graph Signal Inpainting via Unrolling Networks},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2021,
- month = jun,
- doi = {10.1109/ICASSP39728.2021.9413406},
- url = {https://www.merl.com/publications/TR2021-070}
- }
- Chen, S., Eldar, Y., "Graph Signal Denoising via Unrolling Networks", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9415073, June 2021.
BibTeX TR2021-071 PDF- @inproceedings{Chen2021jun3,
- author = {Chen, Siheng and Eldar, Yonina},
- title = {Graph Signal Denoising via Unrolling Networks},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2021,
- month = jun,
- doi = {10.1109/ICASSP39728.2021.9415073},
- url = {https://www.merl.com/publications/TR2021-071}
- }
- Hung, Y.-N., Wichern, G., Le Roux, J., "Transcription Is All You Need: Learning to Separate Musical Mixtures with Score as Supervision", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9413358, June 2021, pp. 46-50.
BibTeX TR2021-069 PDF- @inproceedings{Hung2021jun,
- author = {Hung, Yun-Ning and Wichern, Gordon and Le Roux, Jonathan},
- title = {Transcription Is All You Need: Learning to Separate Musical Mixtures with Score as Supervision},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2021,
- pages = {46--50},
- month = jun,
- doi = {10.1109/ICASSP39728.2021.9413358},
- issn = {2379-190X},
- isbn = {978-1-7281-7605-5},
- url = {https://www.merl.com/publications/TR2021-069}
- }
- Khurana, S., Moritz, N., Hori, T., Le Roux, J., "Unsupervised Domain Adaptation For Speech Recognition via Uncertainty Driven Self-Training", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9414299, June 2021, pp. 6553-6557.
BibTeX TR2021-039 PDF- @inproceedings{Khurana2021jun,
- author = {Khurana, Sameer and Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
- title = {Unsupervised Domain Adaptation For Speech Recognition via Uncertainty Driven Self-Training},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2021,
- pages = {6553--6557},
- month = jun,
- doi = {10.1109/ICASSP39728.2021.9414299},
- url = {https://www.merl.com/publications/TR2021-039}
- }
- Moritz, N., Hori, T., Le Roux, J., "Semi-Supervised Speech Recognition via Graph-Based Temporal Classification", IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), DOI: 10.1109/ICASSP39728.2021.9414058, June 2021, pp. 6548-6552.
BibTeX TR2021-037 PDF- @inproceedings{Moritz2021jun2,
- author = {Moritz, Niko and Hori, Takaaki and Le Roux, Jonathan},
- title = {Semi-Supervised Speech Recognition via Graph-Based Temporal Classification},
- booktitle = {IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
- year = 2021,
- pages = {6548--6552},
- month = jun,
- doi = {10.1109/ICASSP39728.2021.9414058},
- url = {https://www.merl.com/publications/TR2021-037}
- }
- Watanabe, S., Boyer, F., Chang, X., Guo, P., Hayashi, T., Higuchi, Y., Hori, T., Huang, W.-C., Inaguma, H., Kamo, N., Karita, S., Li, C., Shi, J., Subramanian, A.S., Zhang, W., "The 2020 ESPNET Update: New Features, Broadened Applications, Performance Improvements, and Future Plans", IEEE Data Science and Learning Workshop (DSLW), DOI: 10.1109/DSLW51110, June 2021, pp. 1-6.
BibTeX TR2021-073 PDF- @inproceedings{Watanabe2021jun,
- author = {Watanabe, Shinji and Boyer, Florian and Chang, Xuankai and Guo, Pengcheng and Hayashi, Tomoki and Higuchi, Yosuke and Hori, Takaaki and Huang, Wen-Chin and Inaguma, Hirofumi and Kamo, Naoyuki and Karita, Shigeki and Li, Chenda and Shi, Jing and Subramanian, Aswin S. and Zhang, Wangyou},
- title = {The 2020 ESPNET Update: New Features, Broadened Applications, Performance Improvements, and Future Plans},
- booktitle = {IEEE Data Science and Learning Workshop (DSLW)},
- year = 2021,
- pages = {1--6},
- month = jun,
- publisher = {IEEE},
- doi = {10.1109/DSLW51110},
- isbn = {978-1-6654-2826-2},
- url = {https://www.merl.com/publications/TR2021-073}
- }
- Kim, S., Galley, M., Gunasekara, C., Lee, S., Atkinson, A., Peng, B., Schulz, H., Gao, J., Li, J., Adada, M., Huang, M., Lastras, L., Kummerfeld, J.K., Lasecki, W.S., Hori, C., Cherian, A., Marks, T.K., Rastogi, A., Zang, X., Sunkara, S., Gupta, R., "Overview of the Eighth Dialog System Technology Challenge: DSTC8", IEEE/ACM Transactions on Audio, Speech, and Language Processing, DOI: 10.1109/TASLP.2021.3078368, May 2021.
BibTeX TR2021-064 PDF- @article{Kim2021may,
- author = {Kim, Seokhwan and Galley, Michel and Gunasekara, Chulaka and Lee, Sungjin and Atkinson, Adam and Peng, Baolin and Schulz, Hannes and Gao, Jianfeng and Li, Jinchao and Adada, Mahmoud and Huang, Minlie and Lastras, Luis and Kummerfeld, Jonathan K. and Lasecki, Walter S. and Hori, Chiori and Cherian, Anoop and Marks, Tim K. and Rastogi, Abhinav and Zang, Xiaoxue and Sunkara, Srinivas and Gupta, Raghav},
- title = {Overview of the Eighth Dialog System Technology Challenge: DSTC8},
- journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
- year = 2021,
- month = may,
- doi = {10.1109/TASLP.2021.3078368},
- issn = {2329-9290},
- url = {https://www.merl.com/publications/TR2021-064}
- }
- Hori, C., Tsuchiya, M., Chen, S., Cherian, A., Hori, T., Harsham, B.A., Marks, T.K., Le Roux, J., Sullivan, A., Vetro, A., "マルチモーダルセンシング情報に基づくScene-aware Interaction 技術", Society of Automotive Engineers of Japan, Vol. 75, No. 5, pp. 66-71, May 2021.
BibTeX TR2021-042 PDF Video- @article{Hori2021may,
- author = {Hori, Chiori and Tsuchiya, Masato and Chen, Siheng and Cherian, Anoop and Hori, Takaaki and Harsham, Bret A. and Marks, Tim K. and Le Roux, Jonathan and Sullivan, Alan and Vetro, Anthony},
- title = {マルチモーダルセンシング情報に基づくScene-aware Interaction 技術},
- journal = {Society of Automotive Engineers of Japan},
- year = 2021,
- volume = 75,
- number = 5,
- pages = {66--71},
- month = may,
- url = {https://www.merl.com/publications/TR2021-042}
- }
- Pan, C., Chen, S., Ortega, A., "Spatio-Temporal Graph Scattering Transform", International Conference on Learning Representations (ICLR), May 2021.
BibTeX TR2021-044 PDF- @inproceedings{Pan2021may,
- author = {Pan, Chao and Chen, Siheng and Ortega, Antonio},
- title = {Spatio-Temporal Graph Scattering Transform},
- booktitle = {International Conference on Learning Representations (ICLR)},
- year = 2021,
- month = may,
- url = {https://www.merl.com/publications/TR2021-044}
- }
- Han, M., Ozdenizci, O., Koike-Akino, T., Wang, Y., Erdogmus, D., "Universal Physiological Representation Learning with Soft-Disentangled Rateless Autoencoders", IEEE Journal of Biomedical and Health Informatics, DOI: 10.1109/JBHI.2021.3062335, Vol. 25, No. 8, pp. 2928-2937, April 2021.
BibTeX TR2021-027 PDF- @article{Han2021apr,
- author = {Han, Mo and Ozdenizci, Ozan and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
- title = {Universal Physiological Representation Learning with Soft-Disentangled Rateless Autoencoders},
- journal = {IEEE Journal of Biomedical and Health Informatics},
- year = 2021,
- volume = 25,
- number = 8,
- pages = {2928--2937},
- month = apr,
- doi = {10.1109/JBHI.2021.3062335},
- issn = {2168-2208},
- url = {https://www.merl.com/publications/TR2021-027}
- }
- Ramachandra, B., Jones, M.J., Vatsavai, R., "Perceptual Metric Learning for Video Anomaly Detection", Machine Vision and Applications, DOI: 10.1007/s00138-021-01187-5, Vol. 32, No. 63, pp. 1-18, March 2021.
BibTeX TR2021-028 PDF- @article{Ramachandra2021mar,
- author = {Ramachandra, Bharathkumar and Jones, Michael J. and Vatsavai, Ranga},
- title = {Perceptual Metric Learning for Video Anomaly Detection},
- journal = {Machine Vision and Applications},
- year = 2021,
- volume = 32,
- number = 63,
- pages = {1--18},
- month = mar,
- doi = {10.1007/s00138-021-01187-5},
- url = {https://www.merl.com/publications/TR2021-028}
- }
- Demir, A., Koike-Akino, T., Wang, Y., Erdogmus, D., "AutoBayes: Automated Bayesian Graph Exploration for Nuisance-Robust Inference", IEEE Access, DOI: 10.1109/ACCESS.2021.3064530, Vol. 9, pp. 39955-39972, March 2021.
BibTeX TR2021-016 PDF Presentation- @article{Demir2021mar,
- author = {Demir, Andac and Koike-Akino, Toshiaki and Wang, Ye and Erdogmus, Deniz},
- title = {AutoBayes: Automated Bayesian Graph Exploration for Nuisance-Robust Inference},
- journal = {IEEE Access},
- year = 2021,
- volume = 9,
- pages = {39955--39972},
- month = mar,
- doi = {10.1109/ACCESS.2021.3064530},
- issn = {2169-3536},
- url = {https://www.merl.com/publications/TR2021-016}
- }
- Kojima, K., Tang, Y., Koike-Akino, T., Wang, Y., Jha, D.K., TaherSima, M., Parsons, K., "Application of Deep Learning for Nanophotonic Device Design", SPIE Photonics West, Bahram Jalali and Ken-ichi Kitayama, Eds., DOI: 10.1117/12.2579104, March 2021.
BibTeX TR2020-182 PDF Video- @inproceedings{Kojima2021mar,
- author = {Kojima, Keisuke and Tang, Yingheng and Koike-Akino, Toshiaki and Wang, Ye and Jha, Devesh K. and TaherSima, Mohammad and Parsons, Kieran},
- title = {Application of Deep Learning for Nanophotonic Device Design},
- booktitle = {SPIE Photonics West},
- year = 2021,
- editor = {Bahram Jalali and Ken-ichi Kitayama},
- month = mar,
- publisher = {SPIE},
- doi = {10.1117/12.2579104},
- url = {https://www.merl.com/publications/TR2020-182}
- }
- Geng, S., Gao, P., Chatterjee, M., Hori, C., Le Roux, J., Zhang, Y., Li, H., Cherian, A., "Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers", AAAI Conference on Artificial Intelligence, February 2021, pp. 1415-1423.
BibTeX TR2021-010 PDF- @inproceedings{Geng2021feb,
- author = {Geng, Shijie and Gao, Peng and Chatterjee, Moitreya and Hori, Chiori and Le Roux, Jonathan and Zhang, Yongfeng and Li, Hongsheng and Cherian, Anoop},
- title = {Dynamic Graph Representation Learning for Video Dialog via Multi-Modal Shuffled Transformers},
- booktitle = {AAAI Conference on Artificial Intelligence},
- year = 2021,
- pages = {1415--1423},
- month = feb,
- publisher = {AAAI Press, Palo Alto, California USA},
- isbn = {978-1-57735-866-4},
- url = {https://www.merl.com/publications/TR2021-010}
- }