From 160381d9ddbd2cd9355159551bd44e8c102d8964 Mon Sep 17 00:00:00 2001 From: JamesZhutheThird <35760593+JamesZhutheThird@users.noreply.github.com> Date: Sun, 26 May 2024 02:57:06 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20X-LANCE/?= =?UTF-8?q?x-lance.github.io@37b86b5455a61126ea12e12dbfcd812c09177a0f=20?= =?UTF-8?q?=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- 404.html | 2 +- _pages/en/members/index.html | 2 +- _pages/en/under_construction/index.html | 2 +- assets/jupyter/blog.ipynb.html | 2 +- blog/2015/code/index.html | 2 +- blog/2015/disqus-comments/index.html | 2 +- blog/2015/formatting-and-links/index.html | 2 +- blog/2015/images/index.html | 2 +- blog/2015/index.html | 2 +- blog/2015/math/index.html | 2 +- blog/2018/distill/index.html | 2 +- blog/2018/index.html | 2 +- blog/2020/github-metadata/index.html | 2 +- blog/2020/index.html | 2 +- blog/2020/twitter/index.html | 2 +- blog/2021/diagrams/index.html | 2 +- blog/2021/index.html | 2 +- blog/2022/giscus-comments/index.html | 2 +- blog/2022/index.html | 2 +- blog/2022/redirect/index.html | 2 +- blog/2023/audios/index.html | 2 +- blog/2023/custom-blockquotes/index.html | 2 +- blog/2023/index.html | 2 +- blog/2023/jupyter-notebook/index.html | 2 +- blog/2023/post-bibliography/index.html | 2 +- blog/2023/sidebar-table-of-contents/index.html | 2 +- blog/2023/table-of-contents/index.html | 2 +- blog/2023/tables/index.html | 2 +- blog/2023/tikzjax/index.html | 2 +- blog/2023/videos/index.html | 2 +- blog/2024/advanced-images/index.html | 2 +- blog/2024/chartjs/index.html | 2 +- blog/2024/code-diff/index.html | 2 +- blog/2024/echarts/index.html | 2 +- blog/2024/geojson-map/index.html | 2 +- blog/2024/index.html | 2 +- blog/2024/vega-lite/index.html | 2 +- blog/category/external-services/index.html | 2 +- blog/category/sample-posts/index.html | 2 +- blog/index.html | 2 +- blog/page/2/index.html | 2 +- blog/page/3/index.html | 
2 +- blog/page/4/index.html | 2 +- blog/page/5/index.html | 2 +- blog/page/6/index.html | 2 +- blog/tag/audios/index.html | 2 +- blog/tag/bib/index.html | 2 +- blog/tag/blockquotes/index.html | 2 +- blog/tag/charts/index.html | 2 +- blog/tag/code/index.html | 2 +- blog/tag/comments/index.html | 2 +- blog/tag/diagrams/index.html | 2 +- blog/tag/distill/index.html | 2 +- blog/tag/formatting/index.html | 2 +- blog/tag/images/index.html | 2 +- blog/tag/jupyter/index.html | 2 +- blog/tag/links/index.html | 2 +- blog/tag/maps/index.html | 2 +- blog/tag/math/index.html | 2 +- blog/tag/metadata/index.html | 2 +- blog/tag/sidebar/index.html | 2 +- blog/tag/tables/index.html | 2 +- blog/tag/toc/index.html | 2 +- blog/tag/videos/index.html | 2 +- cv/index.html | 2 +- feed.xml | 2 +- index.html | 2 +- members/alumni/index.html | 2 +- members/faculty/index.html | 2 +- members/student/index.html | 2 +- news/announcement_1/index.html | 2 +- news/announcement_2/index.html | 2 +- news/announcement_3/index.html | 2 +- news/announcement_4/index.html | 2 +- news/announcement_5/index.html | 2 +- news/announcement_6/index.html | 2 +- news/announcement_7/index.html | 2 +- news/announcement_8/index.html | 2 +- news/announcement_9/index.html | 2 +- news/index.html | 2 +- papers/index.html | 2 +- projects/1_project/index.html | 2 +- projects/2_project/index.html | 2 +- projects/3_project/index.html | 2 +- projects/4_project/index.html | 2 +- projects/5_project/index.html | 2 +- projects/6_project/index.html | 2 +- projects/index.html | 2 +- repositories/index.html | 2 +- sitemap.xml | 2 +- teaching/index.html | 2 +- zh/404.html | 2 +- zh/_pages/zh/members/index.html | 2 +- zh/_pages/zh/under_construction/index.html | 2 +- zh/blog/2015/code/index.html | 2 +- zh/blog/2015/disqus-comments/index.html | 2 +- zh/blog/2015/formatting-and-links/index.html | 2 +- zh/blog/2015/images/index.html | 2 +- zh/blog/2015/index.html | 2 +- zh/blog/2015/math/index.html | 2 +- zh/blog/2018/distill/index.html | 
2 +- zh/blog/2018/index.html | 2 +- zh/blog/2020/github-metadata/index.html | 2 +- zh/blog/2020/index.html | 2 +- zh/blog/2020/twitter/index.html | 2 +- zh/blog/2021/diagrams/index.html | 2 +- zh/blog/2021/index.html | 2 +- zh/blog/2022/giscus-comments/index.html | 2 +- zh/blog/2022/index.html | 2 +- zh/blog/2022/redirect/index.html | 2 +- zh/blog/2023/audios/index.html | 2 +- zh/blog/2023/custom-blockquotes/index.html | 2 +- zh/blog/2023/index.html | 2 +- zh/blog/2023/jupyter-notebook/index.html | 2 +- zh/blog/2023/post-bibliography/index.html | 2 +- zh/blog/2023/sidebar-table-of-contents/index.html | 2 +- zh/blog/2023/table-of-contents/index.html | 2 +- zh/blog/2023/tables/index.html | 2 +- zh/blog/2023/tikzjax/index.html | 2 +- zh/blog/2023/videos/index.html | 2 +- zh/blog/2024/advanced-images/index.html | 2 +- zh/blog/2024/chartjs/index.html | 2 +- zh/blog/2024/code-diff/index.html | 2 +- zh/blog/2024/echarts/index.html | 2 +- zh/blog/2024/geojson-map/index.html | 2 +- zh/blog/2024/index.html | 2 +- zh/blog/2024/vega-lite/index.html | 2 +- zh/blog/category/external-services/index.html | 2 +- zh/blog/category/sample-posts/index.html | 2 +- zh/blog/index.html | 2 +- zh/blog/page/2/index.html | 2 +- zh/blog/page/3/index.html | 2 +- zh/blog/page/4/index.html | 2 +- zh/blog/page/5/index.html | 2 +- zh/blog/page/6/index.html | 2 +- zh/blog/tag/audios/index.html | 2 +- zh/blog/tag/bib/index.html | 2 +- zh/blog/tag/blockquotes/index.html | 2 +- zh/blog/tag/charts/index.html | 2 +- zh/blog/tag/code/index.html | 2 +- zh/blog/tag/comments/index.html | 2 +- zh/blog/tag/diagrams/index.html | 2 +- zh/blog/tag/distill/index.html | 2 +- zh/blog/tag/formatting/index.html | 2 +- zh/blog/tag/images/index.html | 2 +- zh/blog/tag/jupyter/index.html | 2 +- zh/blog/tag/links/index.html | 2 +- zh/blog/tag/maps/index.html | 2 +- zh/blog/tag/math/index.html | 2 +- zh/blog/tag/metadata/index.html | 2 +- zh/blog/tag/sidebar/index.html | 2 +- zh/blog/tag/tables/index.html | 2 +- 
zh/blog/tag/toc/index.html | 2 +- zh/blog/tag/videos/index.html | 2 +- zh/cv/index.html | 2 +- zh/feed.xml | 2 +- zh/index.html | 2 +- zh/members/alumni/index.html | 2 +- zh/members/faculty/index.html | 2 +- zh/members/student/index.html | 2 +- zh/news/announcement_1/index.html | 2 +- zh/news/announcement_2/index.html | 2 +- zh/news/announcement_3/index.html | 2 +- zh/news/announcement_4/index.html | 2 +- zh/news/announcement_5/index.html | 2 +- zh/news/announcement_6/index.html | 2 +- zh/news/announcement_7/index.html | 2 +- zh/news/announcement_8/index.html | 2 +- zh/news/announcement_9/index.html | 2 +- zh/news/index.html | 2 +- zh/papers/index.html | 2 +- zh/projects/1_project/index.html | 2 +- zh/projects/2_project/index.html | 2 +- zh/projects/3_project/index.html | 2 +- zh/projects/4_project/index.html | 2 +- zh/projects/5_project/index.html | 2 +- zh/projects/6_project/index.html | 2 +- zh/projects/index.html | 2 +- zh/repositories/index.html | 2 +- zh/sitemap.xml | 2 +- zh/teaching/index.html | 2 +- 181 files changed, 181 insertions(+), 181 deletions(-) diff --git a/404.html b/404.html index 4e5bd8f879f6..b77d42395fd7 100644 --- a/404.html +++ b/404.html @@ -1 +1 @@ - Page not found | X - LANCE

Page not found

Looks like there has been a mistake. Nothing exists here.

You will be redirected to the main page within 3 seconds. If not redirected, please go back to the home page.

\ No newline at end of file + Page not found | X - LANCE

Page not found

Looks like there has been a mistake. Nothing exists here.

You will be redirected to the main page within 3 seconds. If not redirected, please go back to the home page.

\ No newline at end of file diff --git a/_pages/en/members/index.html b/_pages/en/members/index.html index e4c1635ceed1..90e296f74dd3 100644 --- a/_pages/en/members/index.html +++ b/_pages/en/members/index.html @@ -1 +1 @@ - 🙌Members | X - LANCE

🙌Members

\ No newline at end of file + 🙌Members | X - LANCE

🙌Members

\ No newline at end of file diff --git a/_pages/en/under_construction/index.html b/_pages/en/under_construction/index.html index 0d5f482f1b0f..61c4bbdf3a46 100644 --- a/_pages/en/under_construction/index.html +++ b/_pages/en/under_construction/index.html @@ -1 +1 @@ - 🛠️Under Construction | X - LANCE

🛠️Under Construction

\ No newline at end of file + 🛠️Under Construction | X - LANCE

🛠️Under Construction

\ No newline at end of file diff --git a/assets/jupyter/blog.ipynb.html b/assets/jupyter/blog.ipynb.html index 30746a64562d..0147f8cff94e 100644 --- a/assets/jupyter/blog.ipynb.html +++ b/assets/jupyter/blog.ipynb.html @@ -1,4 +1,4 @@ - jekyll-jupyter-notebook20240526-1914-jcdlma

PhD Candidates

Chenpeng Du
078-P
Hongshen Xu
091-P
Zihan Zhao
106-P
Danyang Zhang
112-P
Yu Xi
107-P
Xuenan Xu
098-M
Tao Liu
129-P
Ruisheng Cao
084-M
Ziyang Ma
151-P
Da Ma
094-M
Situo Zhang
140-P
Hankun Wang
150-P
Junzhe Liu
160-P
Zichen Zhu
146-UP
Yifan Yang
171-P
Pengyu Wang
145-P
Kunyao Lan
131-MP
Yang Han
166-P
Yiwei Guo
158-P
Jiaming Luo
147-P
Xiujie Song
164-P

Master Candidates

Yuncong Liu
133-P
Ganyu Huang
Jianheng Zhuo
148-M
Hanchong Zhang
165-M
Zeyu Xie
138-U
Zheshu Song
154-M
Liangtai Sun
170-M
Hanqi Li
169-M
Jingpiao Li
168-M
Chaofan He
172-M
Yushen Chen
Siyuan Chen
149-M
Hongchuan Ceng
Guanrou Yang
153-M
Fei Yang
Xiaohang Xu
139-M
Yunchong Xiao
162-M
Yakun Song
Yuezhang Peng
Yijie Luo
Gewei Lu
143-M
Junjie Li
152-M
Haoyu Li
159-M
Senyu Han
167-M
Xingyuan Li
172-M
Yaoyun Zhang

Undergraduates

Baihan Li
157-U
Hanglei Zhang
Chenrun Wang
Xizhuo Zhang
Baocai Chen
Zhennan Shen
Qi Chen
142-U
Yaozhong Zhang
Wenxi Chen
Chen Yang
141-U
Zhisheng Zheng
Yanqiao Zhu
Hang Zheng
Zhikang Niu
Danyu Luo
144-U
Qixi Zheng
Bohan Li
Xuancheng Liu
Zhihan Li
Yuzhe Liang
Yiheng Chen
Zhengshun Xia
Ding Zhou
Xiquan Li
Xinming Shu
Haoxiang Jiang
Ruiyang Xu
Yifan Zhang
Sijia Guo
Bingrui Jin
Tianxi Wan
Yixiao Wang
Wen Wen
\ No newline at end of file + Students | X - LANCE

Students

Students of X-LANCE

PhD Candidates

Chenpeng Du
078-P
Hongshen Xu
091-P
Zihan Zhao
106-P
Danyang Zhang
112-P
Yu Xi
107-P
Xuenan Xu
098-M
Tao Liu
129-P
Ruisheng Cao
084-M
Ziyang Ma
151-P
Da Ma
094-M
Situo Zhang
140-P
Hankun Wang
150-P
Junzhe Liu
160-P
Zichen Zhu
146-UP
Yifan Yang
171-P
Pengyu Wang
145-P
Kunyao Lan
131-MP
Yang Han
166-P
Yiwei Guo
158-P
Jiaming Luo
147-P
Xiujie Song
164-P

Master Candidates

Yuncong Liu
133-P
Ganyu Huang
Jianheng Zhuo
148-M
Hanchong Zhang
165-M
Zeyu Xie
138-U
Zheshu Song
154-M
Liangtai Sun
170-M
Hanqi Li
169-M
Jingpiao Li
168-M
Chaofan He
172-M
Yushen Chen
Siyuan Chen
149-M
Hongchuan Ceng
Guanrou Yang
153-M
Fei Yang
Xiaohang Xu
139-M
Yunchong Xiao
162-M
Yakun Song
Yuezhang Peng
Yijie Luo
Gewei Lu
143-M
Junjie Li
152-M
Haoyu Li
159-M
Senyu Han
167-M
Xingyuan Li
172-M
Yaoyun Zhang

Undergraduates

Baihan Li
157-U
Hanglei Zhang
Chenrun Wang
Xizhuo Zhang
Baocai Chen
Zhennan Shen
Qi Chen
142-U
Yaozhong Zhang
Wenxi Chen
Chen Yang
141-U
Zhisheng Zheng
Yanqiao Zhu
Hang Zheng
Zhikang Niu
Danyu Luo
144-U
Qixi Zheng
Bohan Li
Xuancheng Liu
Zhihan Li
Yuzhe Liang
Yiheng Chen
Zhengshun Xia
Ding Zhou
Xiquan Li
Xinming Shu
Haoxiang Jiang
Ruiyang Xu
Yifan Zhang
Sijia Guo
Bingrui Jin
Tianxi Wan
Yixiao Wang
Wen Wen
\ No newline at end of file diff --git a/news/announcement_1/index.html b/news/announcement_1/index.html index 1a835e4787ed..9d612ea985ec 100644 --- a/news/announcement_1/index.html +++ b/news/announcement_1/index.html @@ -1 +1 @@ - Announcement_1 | X - LANCE

Announcement_1

\ No newline at end of file + Announcement_1 | X - LANCE

Announcement_1

\ No newline at end of file diff --git a/news/announcement_2/index.html b/news/announcement_2/index.html index d71faa3caaa8..35d000a81857 100644 --- a/news/announcement_2/index.html +++ b/news/announcement_2/index.html @@ -1 +1 @@ - Announcement_2 | X - LANCE

Announcement_2

📃[Paper+3] Three papers from X-LANCE Lab accepted by AAAI 2024. [Post]

\ No newline at end of file + Announcement_2 | X - LANCE

Announcement_2

📃[Paper+3] Three papers from X-LANCE Lab accepted by AAAI 2024. [Post]

\ No newline at end of file diff --git a/news/announcement_3/index.html b/news/announcement_3/index.html index 22884e4e0e41..c1224fa70377 100644 --- a/news/announcement_3/index.html +++ b/news/announcement_3/index.html @@ -1 +1 @@ - Announcement_3 | X - LANCE

Announcement_3

📃[Paper+3] Three papers from X-LANCE Lab accepted by COLING 2024 and WSDM 2024. [Post]

\ No newline at end of file + Announcement_3 | X - LANCE

Announcement_3

📃[Paper+3] Three papers from X-LANCE Lab accepted by COLING 2024 and WSDM 2024. [Post]

\ No newline at end of file diff --git a/news/announcement_4/index.html b/news/announcement_4/index.html index ae09b9716228..316a138dd9a4 100644 --- a/news/announcement_4/index.html +++ b/news/announcement_4/index.html @@ -1 +1 @@ - Announcement_4 | X - LANCE

Announcement_4

📃[Paper+2] Two papers from X-LANCE Lab accepted by NAACL 2024. [Post]

\ No newline at end of file + Announcement_4 | X - LANCE

Announcement_4

📃[Paper+2] Two papers from X-LANCE Lab accepted by NAACL 2024. [Post]

\ No newline at end of file diff --git a/news/announcement_5/index.html b/news/announcement_5/index.html index 2308159698d2..162b036e1441 100644 --- a/news/announcement_5/index.html +++ b/news/announcement_5/index.html @@ -1 +1 @@ - Announcement_5 | X - LANCE

Announcement_5

🎆 [New Year Message] Together we celebrate the New Year! The 2024 Annual Dinner of X-LANCE was successfully held. [Post]

\ No newline at end of file + Announcement_5 | X - LANCE

Announcement_5

🎆 [New Year Message] Together we celebrate the New Year! The 2024 Annual Dinner of X-LANCE was successfully held. [Post]

\ No newline at end of file diff --git a/news/announcement_6/index.html b/news/announcement_6/index.html index 32246dfac3b9..15c8af59e47c 100644 --- a/news/announcement_6/index.html +++ b/news/announcement_6/index.html @@ -1 +1 @@ - Announcement_6 | X - LANCE

Announcement_6

🤗 [LLM+1] SJTU, AISpeech, and Suzhou Labs jointly released the first 10B scale large model in chemistry, with chemical capability outperforming GPT-4. [Post]

\ No newline at end of file + Announcement_6 | X - LANCE

Announcement_6

🤗 [LLM+1] SJTU, AISpeech, and Suzhou Labs jointly released the first 10B scale large model in chemistry, with chemical capability outperforming GPT-4. [Post]

\ No newline at end of file diff --git a/news/announcement_7/index.html b/news/announcement_7/index.html index 259103ba1376..23e005c9a975 100644 --- a/news/announcement_7/index.html +++ b/news/announcement_7/index.html @@ -1 +1 @@ - Announcement_7 | X - LANCE

Announcement_7

📃[Paper+2] Two papers from X-LANCE Lab accepted by ICML 2024. [Post]

\ No newline at end of file + Announcement_7 | X - LANCE

Announcement_7

📃[Paper+2] Two papers from X-LANCE Lab accepted by ICML 2024. [Post]

\ No newline at end of file diff --git a/news/announcement_8/index.html b/news/announcement_8/index.html index df93c07e3358..d1137170a70c 100644 --- a/news/announcement_8/index.html +++ b/news/announcement_8/index.html @@ -1 +1 @@ - Announcement_8 | X - LANCE

Announcement_8

📃[Paper+3] Three papers from X-LANCE Lab accepted by ACL 2024 main conference or findings of ACL. [Post]

\ No newline at end of file + Announcement_8 | X - LANCE

Announcement_8

📃[Paper+3] Three papers from X-LANCE Lab accepted by ACL 2024 main conference or findings of ACL. [Post]

\ No newline at end of file diff --git a/news/announcement_9/index.html b/news/announcement_9/index.html index 8a21154f2965..5a31d197e5f3 100644 --- a/news/announcement_9/index.html +++ b/news/announcement_9/index.html @@ -1 +1 @@ - Announcement_9 | X - LANCE

Announcement_9

🌄[PhD Conference] The 2024 PhD Conference was held in Anji, Zhejiang Province. [post]

\ No newline at end of file + Announcement_9 | X - LANCE

Announcement_9

🌄[PhD Conference] The 2024 PhD Conference was held in Anji, Zhejiang Province. [post]

\ No newline at end of file diff --git a/news/index.html b/news/index.html index 11860dc0f4be..363ddf6d823e 100644 --- a/news/index.html +++ b/news/index.html @@ -1 +1 @@ - 🔥News | X - LANCE

🔥News

May 18, 2024 🌄[PhD Conference] The 2024 PhD Conference was held in Anji, Zhejiang Province. [post]
May 16, 2024 📃[Paper+3] Three papers from X-LANCE Lab accepted by ACL 2024 main conference or findings of ACL. [Post]
May 02, 2024 📃[Paper+2] Two papers from X-LANCE Lab accepted by ICML 2024. [Post]
Apr 07, 2024 🤗 [LLM+1] SJTU, AISpeech, and Suzhou Labs jointly released the first 10B scale large model in chemistry, with chemical capability outperforming GPT-4. [Post]
Mar 14, 2024 📃[Paper+2] Two papers from X-LANCE Lab accepted by NAACL 2024. [Post]
Feb 29, 2024 📃[Paper+3] Three papers from X-LANCE Lab accepted by COLING 2024 and WSDM 2024. [Post]
Jan 24, 2024 🎆 [New Year Message] Together we celebrate the New Year! The 2024 Annual Dinner of X-LANCE was successfully held. [Post]
Dec 31, 2023 📃[Paper+3] Three papers from X-LANCE Lab accepted by AAAI 2024. [Post]
Dec 31, 2023 📃[Paper+14] Fourteen papers from X-LANCE Lab accepted by ICASSP 2024. [Post1] [Post2]
\ No newline at end of file + 🔥News | X - LANCE

🔥News

May 18, 2024 🌄[PhD Conference] The 2024 PhD Conference was held in Anji, Zhejiang Province. [post]
May 16, 2024 📃[Paper+3] Three papers from X-LANCE Lab accepted by ACL 2024 main conference or findings of ACL. [Post]
May 02, 2024 📃[Paper+2] Two papers from X-LANCE Lab accepted by ICML 2024. [Post]
Apr 07, 2024 🤗 [LLM+1] SJTU, AISpeech, and Suzhou Labs jointly released the first 10B scale large model in chemistry, with chemical capability outperforming GPT-4. [Post]
Mar 14, 2024 📃[Paper+2] Two papers from X-LANCE Lab accepted by NAACL 2024. [Post]
Feb 29, 2024 📃[Paper+3] Three papers from X-LANCE Lab accepted by COLING 2024 and WSDM 2024. [Post]
Jan 24, 2024 🎆 [New Year Message] Together we celebrate the New Year! The 2024 Annual Dinner of X-LANCE was successfully held. [Post]
Dec 31, 2023 📃[Paper+3] Three papers from X-LANCE Lab accepted by AAAI 2024. [Post]
Dec 31, 2023 📃[Paper+14] Fourteen papers from X-LANCE Lab accepted by ICASSP 2024. [Post1] [Post2]
\ No newline at end of file diff --git a/papers/index.html b/papers/index.html index 9256a0a077fa..26907459525f 100644 --- a/papers/index.html +++ b/papers/index.html @@ -1 +1 @@ - 📃Papers | X - LANCE

📃Papers

Publications are listed in reverse chronological order.

2024

  1. Advanced Long-Content Speech Recognition With Factorized Neural Transducer
    Xun Gong , Yu Wu , Jinyu Li , Shujie Liu , Rui Zhao , Xie Chen, and Yanmin Qian
    IEEE ACM Trans. Audio Speech Lang. Process., 2024
  2. EAT: Self-Supervised Pre-Training with Efficient Audio Transformer
    Wenxi Chen , Yuzhe Liang , Ziyang Ma , Zhisheng Zheng , and Xie Chen
    CoRR, 2024
  3. ELLA-V: Stable Neural Codec Language Modeling with Alignment-guided Sequence Reordering
    Yakun Song , Zhuo Chen , Xiaofei Wang , Ziyang Ma , and Xie Chen
    CoRR, 2024
  4. BAT: Learning to Reason about Spatial Sounds with Large Language Models
    Zhisheng Zheng , Puyuan Peng , Ziyang Ma , Xie Chen, Eunsol Choi , and David Harwath
    CoRR, 2024
  5. An Embarrassingly Simple Approach for LLM with Strong ASR Capacity
    Ziyang Ma , Guanrou Yang , Yifan Yang , Zhifu Gao , Jiaming Wang , Zhihao Du , Fan Yu , Qian Chen , Siqi Zheng , Shiliang Zhang , and Xie Chen
    CoRR, 2024
  6. Beyond the Status Quo: A Contemporary Survey of Advances and Challenges in Audio Captioning
    Xuenan Xu , Zeyu Xie , Mengyue Wu, and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., 2024
  7. Towards Weakly Supervised Text-to-Audio Grounding
    Xuenan Xu , Ziyang Ma , Mengyue Wu, and Kai Yu
    CoRR, 2024
  8. VALL-T: Decoder-Only Generative Transducer for Robust and Decoding-Controllable Text-to-Speech
    Chenpeng Du , Yiwei Guo , Hankun Wang , Yifan Yang , Zhikang Niu , Shuai Wang , Hui Zhang , Xie Chen, and Kai Yu
    CoRR, 2024
  9. ChemDFM: Dialogue Foundation Model for Chemistry
    Zihan Zhao , Da Ma , Lu Chen, Liangtai Sun , Zihao Li , Hongshen Xu , Zichen Zhu , Su Zhu , Shuai Fan , Guodong Shen , Xin Chen , and Kai Yu
    CoRR, 2024
  10. MULTI: Multimodal Understanding Leaderboard with Text and Images
    Zichen Zhu, Yang Xu , Lu Chen, Jingkai Yang , Yichuan Ma , Yiming Sun , Hailin Wen , Jiaqi Liu , Jinyu Cai , Yingzi Ma , Situo Zhang , Zihan Zhao , Liangtai Sun , and Kai Yu
    CoRR, 2024

2023

  1. A Unified Framework From Face Image Restoration to Data Augmentation Using Generative Prior
    Jiawei You , Ganyu Huang , Tianyuan Han , Haoze Yang , and Liping Shen
    IEEE Access, 2023
  2. Human Pose Estimation with Combined Feature Maps and Joint Embeddings
    Tianyuan Han , Ganyu Huang , Chunhui Li , and Liping Shen
    In Proceedings of the 2023 International Conference on Advances in Artificial Intelligence and Applications, AAIA 2023, Wuhan, China, November 18-20, 2023 , 2023
  3. Assessing and Enhancing LLMs: A Physics and History Dataset and One-More-Check Pipeline Method
    Chaofan He , Chunhui Li , Tianyuan Han , and Liping Shen
    In Neural Information Processing - 30th International Conference, ICONIP 2023, Changsha, China, November 20-23, 2023, Proceedings, Part XIII , 2023
  4. GAN Latent Space Manipulation Based Augmentation for Unbalanced Emotion Datasets
    Yuhan Xiong , Jiawei You , and Liping Shen
    In International Joint Conference on Neural Networks, IJCNN 2023, Gold Coast, Australia, June 18-23, 2023 , 2023
  5. LongFNT: Long-Form Speech Recognition with Factorized Neural Transducer
    Xun Gong , Yu Wu , Jinyu Li , Shujie Liu , Rui Zhao , Xie Chen, and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  6. Factorized AED: Factorized Attention-Based Encoder-Decoder for Text-Only Domain Adaptive ASR
    Xun Gong , Wei Wang , Hang Shao , Xie Chen, and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  7. Exploring Binary Classification Loss for Speaker Verification
    Bing Han , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  8. Improving Dino-Based Self-Supervised Speaker Verification with Progressive Cluster-Aware Training
    Bing Han , Wen Huang , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
  9. Robust Audio-Visual ASR with Unified Cross-Modal Attention
    Jiahong Li , Chenda Li , Yifei Wu , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  10. Target Sound Extraction with Variable Cross-Modality Clues
    Chenda Li , Yao Qian , Zhuo Chen , Dongmei Wang , Takuya Yoshioka , Shujie Liu , Yanmin Qian , and Michael Zeng
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  11. Predictive Skim: Contrastive Predictive Coding for Low-Latency Online Speech Separation
    Chenda Li , Yifei Wu , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  12. Multi-Speaker End-to-End Multi-Modal Speaker Diarization System for the MISP 2022 Challenge
    Tao Liu , Zhengyang Chen , Yanmin Qian , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  13. Joint Discriminator and Transfer Based Fast Domain Adaptation For End-To-End Speech Recognition
    Hang Shao , Tian Tan , Wei Wang , Xun Gong , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  14. Lowbit Neural Network Quantization for Speaker Verification
    Haoyu Wang , Bei Liu , Yifei Wu , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
  15. Wespeaker: A Research and Production Oriented Speaker Embedding Learning Toolkit
    Hongji Wang , Chengdong Liang , Shuai Wang , Zhengyang Chen , Binbin Zhang , Xu Xiang , Yanlei Deng , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  16. HuBERT-AGG: Aggregated Representation Distillation of Hidden-Unit Bert for Robust Speech Recognition
    Wei Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  17. Light-Weight Visualvoice: Neural Network Quantization On Audio Visual Speech Separation
    Yifei Wu , Chenda Li , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
  18. Code-Switching Text Generation and Injection in Mandarin-English ASR
    Haibin Yu , Yuxuan Hu , Yao Qian , Ma Jin , Linquan Liu , Shujie Liu , Yu Shi , Yanmin Qian , Edward Lin , and Michael Zeng
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  19. Adaptive Large Margin Fine-Tuning For Robust Speaker Verification
    Leying Zhang , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  20. ComSL: A Composite Speech-Language Model for End-to-End Speech-to-Text Translation
    Chenyang Le , Yao Qian , Long Zhou , Shujie Liu , Yanmin Qian , Michael Zeng , and Xuedong Huang
    In Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023 , 2023
  21. Exploring the Integration of Speech Separation and Recognition with Self-Supervised Learning Representation
    Yoshiki Masuyama , Xuankai Chang , Wangyou Zhang , Samuele Cornell , Zhong-Qiu Wang , Nobutaka Ono , Yanmin Qian , and Shinji Watanabe
    In IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2023, New Paltz, NY, USA, October 22-25, 2023 , 2023
  22. Software Design and User Interface of ESPnet-SE++: Speech Enhancement for Robust Speech Processing (espnet-v.202310) (Version 1)
    Yen-Ju Lu , Xuankai Chang , Chenda Li , Wangyou Zhang , Samuele Cornell , Zhaoheng Ni , Yoshiki Masuyama , Brian Yan , Robin Scheibler , Zhong-Qiu Wang , Yu Tsao , Yanmin Qian , and Shinji Watanabe
    Oct 2023
    Accessed on YYYY-MM-DD.
  23. Self-Supervised Learning with Cluster-Aware-DINO for High-Performance Robust Speaker Verification
    Bing Han , Zhengyang Chen , and Yanmin Qian
    CoRR, Oct 2023
  24. Attention-based Encoder-Decoder Network for End-to-End Neural Speaker Diarization with Target Speaker Attractor
    Zhengyang Chen , Bing Han , Shuai Wang , and Yanmin Qian
    CoRR, Oct 2023
  25. Whisper-KDQ: A Lightweight Whisper via Guided Knowledge Distillation and Quantization for Efficient ASR
    Hang Shao , Wei Wang , Bei Liu , Xun Gong , Haoyu Wang , and Yanmin Qian
    CoRR, Oct 2023
  26. Weakly-Supervised Speech Pre-training: A Case Study on Target Speech Recognition
    Wangyou Zhang , and Yanmin Qian
    CoRR, Oct 2023
  27. Adapting Multi-Lingual ASR Models for Handling Multiple Talkers
    Chenda Li , Yao Qian , Zhuo Chen , Naoyuki Kanda , Dongmei Wang , Takuya Yoshioka , Yanmin Qian , and Michael Zeng
    CoRR, Oct 2023
  28. InstructME: An Instruction Guided Music Edit And Remix Framework with Latent Diffusion Models
    Bing Han , Junyu Dai , Xuchen Song , Weituo Hao , Xinyan He , Dong Guo , Jitong Chen , Yuxuan Wang , and Yanmin Qian
    CoRR, Oct 2023
  29. Attention-based Encoder-Decoder End-to-End Neural Diarization with Embedding Enhancer
    Zhengyang Chen , Bing Han , Shuai Wang , and Yanmin Qian
    CoRR, Oct 2023
  30. USED: Universal Speaker Extraction and Diarization
    Junyi Ao , Mehmet Sinan Yildirim , Meng Ge , Shuai Wang , Ruijie Tao , Yanmin Qian , Liqun Deng , Longshuai Xiao , and Haizhou Li
    CoRR, Oct 2023
  31. Leveraging In-the-Wild Data for Effective Self-Supervised Pretraining in Speaker Recognition
    Shuai Wang , Qibing Bai , Qi Liu , Jianwei Yu , Zhengyang Chen , Bing Han , Yanmin Qian , and Haizhou Li
    CoRR, Oct 2023
  32. The second multi-channel multi-party meeting transcription challenge (M2MeT 2.0): A benchmark for speaker-attributed ASR
    Yuhao Liang , Mohan Shi , Fan Yu , Yangze Li , Shiliang Zhang , Zhihao Du , Qian Chen , Lei Xie , Yanmin Qian , Jian Wu , Zhuo Chen , Kong Aik Lee , Zhijie Yan , and Hui Bu
    CoRR, Oct 2023
  33. Diffusion Conditional Expectation Model for Efficient and Robust Target Speech Extraction
    Leying Zhang , Yao Qian , Linfeng Yu , Heming Wang , Xinkai Wang , Hemin Yang , Long Zhou , Shujie Liu , Yanmin Qian , and Michael Zeng
    CoRR, Oct 2023
  34. Toward Universal Speech Enhancement for Diverse Input Conditions
    Wangyou Zhang , Kohei Saijo , Zhong-Qiu Wang , Shinji Watanabe , and Yanmin Qian
    CoRR, Oct 2023
  35. One-Shot Sensitivity-Aware Mixed Sparsity Pruning for Large Language Models
    Hang Shao , Bei Liu , and Yanmin Qian
    CoRR, Oct 2023
  36. FAT-HuBERT: Front-end Adaptive Training of Hidden-unit BERT for Distortion-Invariant Robust Speech Recognition
    Dongning Yang , Wei Wang , and Yanmin Qian
    CoRR, Oct 2023
  37. Speaker Adaptive Text-to-Speech With Timbre-Normalized Vector-Quantized Feature
    Chenpeng Du , Yiwei Guo , Xie Chen, and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2023
  38. Fast-Hubert: an Efficient Training Framework for Self-Supervised Speech Representation Learning
    Guanrou Yang , Ziyang Ma , Zhisheng Zheng , Yakun Song , Zhikang Niu , and Xie Chen
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2023, Taipei, Taiwan, December 16-20, 2023 , Oct 2023
  39. Improving Few-Shot Learning for Talking Face System with TTS Data Augmentation
    Qi Chen , Ziyang Ma , Tao Liu , Xu Tan , Qu Lu , Kai Yu , and Xie Chen
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  40. Front-End Adapter: Adapting Front-End Input of Speech Based Self-Supervised Learning for Speech Recognition
    Xie Chen, Ziyang Ma , Changli Tang , Yujin Wang , and Zhisheng Zheng
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  41. Emodiff: Intensity Controllable Emotional Text-to-Speech with Soft-Label Guidance
    Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  42. DAE-Talker: High Fidelity Speech-Driven Talking Face Generation with Diffusion Autoencoder
    Chenpeng Du , Qi Chen , Tianyu He , Xu Tan , Xie Chen, Kai Yu, Sheng Zhao , and Jiang Bian
    In Proceedings of the 31st ACM International Conference on Multimedia, MM 2023, Ottawa, ON, Canada, 29 October 2023- 3 November 2023 , Oct 2023
  43. Blank-regularized CTC for Frame Skipping in Neural Transducer
    Yifan Yang , Xiaoyu Yang , Liyong Guo , Zengwei Yao , Wei Kang , Fangjun Kuang , Long Lin , Xie Chen, and Daniel Povey
    CoRR, Oct 2023
  44. UniCATS: A Unified Context-Aware Text-to-Speech Framework with Contextual VQ-Diffusion and Vocoding
    Chenpeng Du , Yiwei Guo , Feiyu Shen , Zhijun Liu , Zheng Liang , Xie Chen, Shuai Wang , Hui Zhang , and Kai Yu
    CoRR, Oct 2023
  45. Improving Code-Switching and Named Entity Recognition in ASR with Speech Editing based Data Augmentation
    Zheng Liang , Zheshu Song , Ziyang Ma , Chenpeng Du , Kai Yu , and Xie Chen
    CoRR, Oct 2023
  46. Pushing the Limits of Unsupervised Unit Discovery for SSL Speech Representation
    Ziyang Ma , Zhisheng Zheng , Guanrou Yang , Yu Wang , Chao Zhang , and Xie Chen
    CoRR, Oct 2023
  47. Towards Effective and Compact Contextual Representation for Conformer Transducer Speech Recognition Systems
    Mingyu Cui , Jiawen Kang , Jiajun Deng , Xi Yin , Yutao Xie , Xie Chen, and Xunying Liu
    CoRR, Oct 2023
  48. DSE-TTS: Dual Speaker Embedding for Cross-Lingual Text-to-Speech
    Sen Liu , Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
    CoRR, Oct 2023
  49. Unsupervised Active Learning: Optimizing Labeling Cost-Effectiveness for Automatic Speech Recognition
    Zhisheng Zheng , Ziyang Ma , Yu Wang , and Xie Chen
    CoRR, Oct 2023
  50. VoiceFlow: Efficient Text-to-Speech with Rectified Flow Matching
    Yiwei Guo , Chenpeng Du , Ziyang Ma , Xie Chen, and Kai Yu
    CoRR, Oct 2023
  51. Towards Universal Speech Discrete Tokens: A Case Study for ASR and TTS
    Yifan Yang , Feiyu Shen , Chenpeng Du , Ziyang Ma , Kai Yu, Daniel Povey , and Xie Chen
    CoRR, Oct 2023
  52. Incorporating Class-based Language Model for Named Entity Recognition in Factorized Neural Transducer
    Peng Wang , Yifan Yang , Zheng Liang , Tian Tan , Shiliang Zhang , and Xie Chen
    CoRR, Oct 2023
  53. Improved Factorized Neural Transducer Model For text-only Domain Adaptation
    Junzhe Liu , Jianwei Yu , and Xie Chen
    CoRR, Oct 2023
  54. Leveraging Speech PTM, Text LLM, and Emotional TTS for Speech Emotion Recognition
    Ziyang Ma , Wen Wu , Zhisheng Zheng , Yiwei Guo , Qian Chen , Shiliang Zhang , and Xie Chen
    CoRR, Oct 2023
  55. Acoustic BPE for Speech Generation with Discrete Tokens
    Feiyu Shen , Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
    CoRR, Oct 2023
  56. Expressive TTS Driven by Natural Language Prompts Using Few Human Annotations
    Hanglei Zhang , Yiwei Guo , Sen Liu , Xie Chen, and Kai Yu
    CoRR, Oct 2023
  57. emotion2vec: Self-Supervised Pre-Training for Speech Emotion Representation
    Ziyang Ma , Zhisheng Zheng , Jiaxin Ye , Jinchao Li , Zhifu Gao , Shiliang Zhang , and Xie Chen
    CoRR, Oct 2023
  58. OPAL: Ontology-Aware Pretrained Language Model for End-to-End Task-Oriented Dialogue
    Zhi Chen , Yuncong Liu , Lu Chen , Su Zhu , Mengyue Wu, and Kai Yu
    Trans. Assoc. Comput. Linguistics, Oct 2023
  59. Transcribing Vocal Communications of Domestic Shiba Inu Dogs
    Jieyi Huang , Chunhao Zhang , Mengyue Wu , and Kenny Q. Zhu
    In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  60. Detection of Multiple Mental Disorders from Social Media with Two-Stream Psychiatric Experts
    Siyuan Chen , Zhiling Zhang , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
  61. Semantic Space Grounded Weighted Decoding for Multi-Attribute Controllable Dialogue Generation
    Zhiling Zhang , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
  62. Diverse and Vivid Sound Generation from Text Descriptions
    Guangwei Li , Xuenan Xu , Lingfeng Dai , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  63. Investigating Pooling Strategies and Loss Functions for Weakly-Supervised Text-to-Audio Grounding via Contrastive Learning
    Xuenan Xu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  64. BLAT: Bootstrapping Language-Audio Pre-training based on AudioSet Tag-guided Synthetic Data
    Xuenan Xu , Zhiling Zhang , Zelin Zhou , Pingyue Zhang , Zeyu Xie , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the 31st ACM International Conference on Multimedia, MM 2023, Ottawa, ON, Canada, 29 October 2023 - 3 November 2023 , Oct 2023
  65. LLM-empowered Chatbots for Psychiatrist and Patient Simulation: Application and Evaluation
    Siyuan Chen , Mengyue Wu , Kenny Q. Zhu , Kunyao Lan , Zhiling Zhang , and Lyuchun Cui
    CoRR, Oct 2023
  66. Enhance Temporal Relations in Audio Captioning with Sound Event Detection
    Zeyu Xie , Xuenan Xu , Mengyue Wu, and Kai Yu
    CoRR, Oct 2023
  67. Improving Audio Caption Fluency with Automatic Error Correction
    Hanxue Zhang , Zeyu Xie , Xuenan Xu , Mengyue Wu, and Kai Yu
    CoRR, Oct 2023
  68. A Large-scale Dataset for Audio-Language Representation Learning
    Luoyi Sun , Xuenan Xu , Mengyue Wu, and Weidi Xie
    CoRR, Oct 2023
  69. Does My Dog "Speak" Like Me? The Acoustic Correlation between Pet Dogs and Their Human Owners
    Jieyi Huang , Chunhao Zhang , Yufei Wang , Mengyue Wu , and Kenny Q. Zhu
    CoRR, Oct 2023
  70. Towards Lexical Analysis of Dog Vocalizations via Online Videos
    Yufei Wang , Chunhao Zhang , Jieyi Huang , Mengyue Wu , and Kenny Q. Zhu
    CoRR, Oct 2023
  71. PsyEval: A Comprehensive Large Language Model Evaluation Benchmark for Mental Health
    Haoan Jin , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
    CoRR, Oct 2023
  72. A Heterogeneous Graph to Abstract Syntax Tree Framework for Text-to-SQL
    Ruisheng Cao , Lu Chen, Jieyu Li , Hanchong Zhang , Hongshen Xu , Wangyou Zhang , and Kai Yu
    IEEE Trans. Pattern Anal. Mach. Intell., Oct 2023
  73. Speech Enhancement With Integration of Neural Homomorphic Synthesis and Spectral Masking
    Wenbin Jiang , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2023
  74. SPM: A Split-Parsing Method for Joint Multi-Intent Detection and Slot Filling
    Sheng Jiang , Su Zhu , Ruisheng Cao , Qingliang Miao , and Kai Yu
    In Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics: Industry Track, ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  75. Exploring Schema Generalizability of Text-to-SQL
    Jieyu Li , Lu Chen, Ruisheng Cao , Su Zhu , Hongshen Xu , Zhi Chen , Hanchong Zhang , and Kai Yu
    In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  76. TeCS: A Dataset and Benchmark for Tense Consistency of Machine Translation
    Yiming Ai , Zhiwei He , Kai Yu, and Rui Wang
    In Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  77. CSS: A Large-scale Cross-schema Chinese Text-to-SQL Medical Dataset
    Hanchong Zhang , Jieyu Li , Lu Chen, Ruisheng Cao , Yunyan Zhang , Yu Huang , Yefeng Zheng , and Kai Yu
    In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  78. ACT-SQL: In-Context Learning for Text-to-SQL with Automatically-Generated Chain-of-Thought
    Hanchong Zhang , Ruisheng Cao , Lu Chen, Hongshen Xu , and Kai Yu
    In Findings of the Association for Computational Linguistics: EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
  79. Multi-Speaker Multi-Lingual VQTTS System for LIMMITS 2023 Challenge
    Chenpeng Du , Yiwei Guo , Feiyu Shen , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  80. DiffVoice: Text-to-Speech with Latent Diffusion
    Zhijun Liu , Yiwei Guo , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  81. Large Language Models Are Semi-Parametric Reinforcement Learning Agents
    Danyang Zhang , Lu Chen, Situo Zhang , Hongshen Xu , Zihan Zhao , and Kai Yu
    In Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023 , Oct 2023
  82. Mobile-Env: A Universal Platform for Training and Evaluation of Mobile Interaction
    Danyang Zhang , Lu Chen, and Kai Yu
    CoRR, Oct 2023
  83. SciEval: A Multi-Level Large Language Model Evaluation Benchmark for Scientific Research
    Liangtai Sun , Yang Han , Zihan Zhao , Da Ma , Zhennan Shen , Baocai Chen , Lu Chen, and Kai Yu
    CoRR, Oct 2023
  84. ASTormer: An AST Structure-aware Transformer Decoder for Text-to-SQL
    Ruisheng Cao , Hanchong Zhang , Hongshen Xu , Jieyu Li , Da Ma , Lu Chen, and Kai Yu
    CoRR, Oct 2023
  85. DiffDub: Person-generic Visual Dubbing Using Inpainting Renderer with Diffusion Auto-encoder
    Tao Liu , Chenpeng Du , Shuai Fan , Feilong Chen , and Kai Yu
    CoRR, Oct 2023
  86. SEF-VC: Speaker Embedding Free Zero-Shot Voice Conversion with Cross Attention
    Junjie Li , Yiwei Guo , Xie Chen, and Kai Yu
    CoRR, Oct 2023

2022

  1. Heterogeneous Graph Representation for Knowledge Tracing
    Jisen Chen , Jian Shen , Ting Long , Liping Shen, Weinan Zhang , and Yong Yu
    In Neural Information Processing - 29th International Conference, ICONIP 2022, Virtual Event, November 22-26, 2022, Proceedings, Part I , Oct 2022
  2. A simple but practical method: How to improve the usage of entities in the Chinese question generation
    Haoze Yang , Kunyao Lan , Jiawei You , and Liping Shen
    In International Joint Conference on Neural Networks, IJCNN 2022, Padua, Italy, July 18-23, 2022 , Oct 2022
  3. From Uniform Models To Generic Representations: Stock Return Prediction With Pre-training
    Jiawei You , Tianyuan Han , and Liping Shen
    In International Joint Conference on Neural Networks, IJCNN 2022, Padua, Italy, July 18-23, 2022 , Oct 2022
  4. WavLM: Large-Scale Self-Supervised Pre-Training for Full Stack Speech Processing
    Sanyuan Chen , Chengyi Wang , Zhengyang Chen , Yu Wu , Shujie Liu , Zhuo Chen , Jinyu Li , Naoyuki Kanda , Takuya Yoshioka , Xiong Xiao , Jian Wu , Long Zhou , Shuo Ren , Yanmin Qian , Yao Qian , Jian Wu , Michael Zeng , Xiangzhan Yu , and Furu Wei
    IEEE J. Sel. Top. Signal Process., Oct 2022
  5. Optimizing Data Usage for Low-Resource Speech Recognition
    Yanmin Qian , and Zhikai Zhou
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  6. Dual-Path Modeling With Memory Embedding Model for Continuous Speech Separation
    Chenda Li , Zhuo Chen , and Yanmin Qian
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  7. Layer-Wise Fast Adaptation for End-to-End Multi-Accent Speech Recognition
    Yanmin Qian , Xun Gong , and Houjun Huang
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  8. End-to-End Dereverberation, Beamforming, and Speech Recognition in a Cocktail Party
    Wangyou Zhang , Xuankai Chang , Christoph Böddeker , Tomohiro Nakatani , Shinji Watanabe , and Yanmin Qian
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  9. Time-Domain Audio-Visual Speech Separation on Low Quality Videos
    Yifei Wu , Chenda Li , Jinfeng Bai , Zhongqin Wu , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  10. SkiM: Skipping Memory LSTM for Low-Latency Real-Time Continuous Speech Separation
    Chenda Li , Lei Yang , Weiqin Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  11. Large-Scale Self-Supervised Speech Representation Learning for Automatic Speaker Verification
    Zhengyang Chen , Sanyuan Chen , Yu Wu , Yao Qian , Chengyi Wang , Shujie Liu , Yanmin Qian , and Michael Zeng
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  12. Local Information Modeling with Self-Attention for Speaker Verification
    Bing Han , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  13. Punctuation Prediction for Streaming On-Device Speech Recognition
    Zhikai Zhou , Tian Tan , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  14. MLP-SVNET: A Multi-Layer Perceptrons Based Network for Speaker Verification
    Bing Han , Zhengyang Chen , Bei Liu , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  15. Self-Knowledge Distillation via Feature Enhancement for Speaker Verification
    Bei Liu , Haoyu Wang , Zhengyang Chen , Shuai Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  16. Optimizing Alignment of Speech and Language Latent Spaces for End-To-End Speech Recognition and Understanding
    Wei Wang , Shuo Ren , Yao Qian , Shujie Liu , Yu Shi , Yanmin Qian , and Michael Zeng
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  17. Exploring Effective Data Utilization for Low-Resource Speech Recognition
    Zhikai Zhou , Wei Wang , Wangyou Zhang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  18. Summary on the ICASSP 2022 Multi-Channel Multi-Party Meeting Transcription Grand Challenge
    Fan Yu , Shiliang Zhang , Pengcheng Guo , Yihui Fu , Zhihao Du , Siqi Zheng , Weilong Huang , Lei Xie , Zheng-Hua Tan , DeLiang Wang , Yanmin Qian , Kong Aik Lee , Zhijie Yan , Bin Ma , Xin Xu , and Hui Bu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  19. The SJTU System For Multimodal Information Based Speech Processing Challenge 2021
    Wei Wang , Xun Gong , Yifei Wu , Zhikai Zhou , Chenda Li , Wangyou Zhang , Bing Han , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  20. Attentive Feature Fusion for Robust Speaker Verification
    Bei Liu , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  21. Dual Path Embedding Learning for Speaker Verification with Triplet Attention
    Bei Liu , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  22. DF-ResNet: Boosting Speaker Verification Performance with Depth-First Design
    Bei Liu , Zhengyang Chen , Shuai Wang , Haoyu Wang , Bing Han , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  23. Enroll-Aware Attentive Statistics Pooling for Target Speaker Verification
    Leying Zhang , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  24. MSDWild: Multi-modal Speaker Diarization Dataset in the Wild
    Tao Liu , Shuai Fan , Xu Xiang , Hongbo Song , Shaoxiong Lin , Jiaqi Sun , Tianyuan Han , Siyuan Chen , Binwei Yao , Sen Liu , Yifei Wu , Yanmin Qian , and Kai Yu
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  25. Knowledge Transfer and Distillation from Autoregressive to Non-Autoregressive Speech Recognition
    Xun Gong , Zhikai Zhou , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  26. Self-Supervised Speaker Verification Using Dynamic Loss-Gate and Label Correction
    Bing Han , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  27. Separating Long-Form Speech with Group-wise Permutation Invariant Training
    Wangyou Zhang , Zhuo Chen , Naoyuki Kanda , Shujie Liu , Jinyu Li , Sefik Emre Eskimez , Takuya Yoshioka , Xiong Xiao , Zhong Meng , Yanmin Qian , and Furu Wei
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  28. ESPnet-SE++: Speech Enhancement for Robust Speech Recognition, Translation, and Understanding
    Yen-Ju Lu , Xuankai Chang , Chenda Li , Wangyou Zhang , Samuele Cornell , Zhaoheng Ni , Yoshiki Masuyama , Brian Yan , Robin Scheibler , Zhong-Qiu Wang , Yu Tsao , Yanmin Qian , and Shinji Watanabe
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  29. Improving Speech Separation with Knowledge Distilled from Self-supervised Pre-trained Models
    Bowen Qu , Chenda Li , Jinfeng Bai , and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  30. Text-Informed Knowledge Distillation for Robust Speech Enhancement and Recognition
    Wei Wang , Wangyou Zhang , Shaoxiong Lin , and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  31. Medical Difficult Airway Detection using Speech Technology
    Zhikai Zhou , Shuang Cao , Zhengyang Chen , Bei Liu , Ming Xia , Hong Jiang , and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  32. Speaking style compensation on synthetic audio for robust keyword spotting
    Houjun Huang , and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  33. The Conversational Short-phrase Speaker Diarization (CSSD) Task: Dataset, Evaluation Metric and Baselines
    Gaofeng Cheng , Yifan Chen , Runyan Yang , Qingxuan Li , Zehui Yang , Lingxuan Ye , Pengyuan Zhang , Qingqing Zhang , Lei Xie , Yanmin Qian , Kong Aik Lee , and Yonghong Yan
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  34. The X-Lance Speaker Diarization System for the Conversational Short-phrase Speaker Diarization Challenge 2022
    Tao Liu , Xu Xiang , Zhengyang Chen , Bing Han , Kai Yu, and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  35. End-to-End Multi-Speaker ASR with Independent Vector Analysis
    Robin Scheibler , Wangyou Zhang , Xuankai Chang , Shinji Watanabe , and Yanmin Qian
    In IEEE Spoken Language Technology Workshop, SLT 2022, Doha, Qatar, January 9-12, 2023 , Oct 2022
  36. A Comprehensive Study on Self-Supervised Distillation for Speaker Representation Learning
    Zhengyang Chen , Yao Qian , Bing Han , Yanmin Qian , and Michael Zeng
    In IEEE Spoken Language Technology Workshop, SLT 2022, Doha, Qatar, January 9-12, 2023 , Oct 2022
  37. The SJTU X-LANCE Lab System for CNSRC 2022
    Zhengyang Chen , Bei Liu , Bing Han , Leying Zhang , and Yanmin Qian
    CoRR, Oct 2022
  38. SJTU-AISPEECH System for VoxCeleb Speaker Recognition Challenge 2022
    Zhengyang Chen , Bing Han , Xu Xiang , Houjun Huang , Bei Liu , and Yanmin Qian
    CoRR, Oct 2022
  39. Build a SRE Challenge System: Lessons from VoxSRC 2022 and CNSRC 2022
    Zhengyang Chen , Bing Han , Xu Xiang , Houjun Huang , Bei Liu , and Yanmin Qian
    CoRR, Oct 2022
  40. Factorized Neural Transducer for Efficient Language Model Adaptation
    Xie Chen, Zhong Meng , Sarangarajan Parthasarathy , and Jinyu Li
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  41. VQTTS: High-Fidelity Text-to-Speech Synthesis with Self-Supervised VQ Acoustic Feature
    Chenpeng Du , Yiwei Guo , Xie Chen, and Kai Yu
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  42. Internal Language Model Adaptation with Text-Only Data for End-to-End Speech Recognition
    Zhong Meng , Yashesh Gaur , Naoyuki Kanda , Jinyu Li , Xie Chen , Yu Wu , and Yifan Gong
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  43. Exploring Effective Distillation of Self-Supervised Speech Models for Automatic Speech Recognition
    Yujin Wang , Changli Tang , Ziyang Ma , Zhisheng Zheng , Xie Chen, and Wei-Qiang Zhang
    CoRR, Oct 2022
  44. MT4SSL: Boosting Self-Supervised Speech Representation Learning by Integrating Multiple Targets
    Ziyang Ma , Zhisheng Zheng , Changli Tang , Yujin Wang , and Xie Chen
    CoRR, Oct 2022
  45. EmoDiff: Intensity Controllable Emotional Text-to-Speech with Soft-Label Guidance
    Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
    CoRR, Oct 2022
  46. Exploring Effective Fusion Algorithms for Speech Based Self-Supervised Learning Models
    Changli Tang , Yujin Wang , Xie Chen, and Wei-Qiang Zhang
    CoRR, Oct 2022
  47. D4: a Chinese Dialogue Dataset for Depression-Diagnosis-Oriented Chat
    Binwei Yao , Chao Shi , Likai Zou , Lingfeng Dai , Mengyue Wu, Lu Chen, Zhen Wang , and Kai Yu
    In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
  48. Symptom Identification for Interpretable Detection of Multiple Mental Disorders on Social Media
    Zhiling Zhang , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
  49. Category-Adapted Sound Event Enhancement with Weakly Labeled Data
    Guangwei Li , Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  50. Diversity-Controllable and Accurate Audio Captioning Based on Neural Condition
    Xuenan Xu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  51. Can Audio Captions Be Evaluated With Image Caption Metrics?
    Zelin Zhou , Zhiling Zhang , Xuenan Xu , Zeyu Xie , Mengyue Wu , and Kenny Q. Zhu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  52. Navigating Audio-Visual Event Detection Across Mismatched Modalities
    Guangwei Li , Xuenan Xu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  53. Audio-Text Retrieval in Context
    Siyu Lou , Xuenan Xu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  54. Climate and Weather: Inspecting Depression Detection via Emotion Recognition
    Wen Wu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  55. Psychiatric Scale Guided Risky Post Screening for Early Detection of Depression
    Zhiling Zhang , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence, IJCAI 2022, Vienna, Austria, 23-29 July 2022 , Oct 2022
  56. A Comprehensive Survey of Automated Audio Captioning
    Xuenan Xu , Mengyue Wu, and Kai Yu
    CoRR, Oct 2022
  57. DialogZoo: Large-Scale Dialog-Oriented Task Learning
    Zhi Chen , Jijia Bao , Lu Chen, Yuncong Liu , Da Ma , Bei Chen , Mengyue Wu , Su Zhu , Jian-Guang Lou , and Kai Yu
    CoRR, Oct 2022
  58. Data augmentation based non-parallel voice conversion with frame-level speaker disentangler
    Bo Chen , Zhihang Xu , and Kai Yu
    Speech Commun., Oct 2022
  59. Phone-Level Prosody Modelling With GMM-Based MDN for Diverse and Controllable Speech Synthesis
    Chenpeng Du , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  60. Neural Fusion for Voice Cloning
    Bo Chen , Chenpeng Du , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  61. META-GUI: Towards Multi-modal Conversational Agents on Mobile GUI
    Liangtai Sun , Xingyu Chen , Lu Chen, Tianle Dai , Zichen Zhu, and Kai Yu
    In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
  62. AdapterShare: Task Correlation Modeling with Adapter Differentiation
    Zhi Chen , Bei Chen , Lu Chen, Kai Yu, and Jian-Guang Lou
    In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
  63. LatticeBART: Lattice-to-Lattice Pre-Training for Speech Recognition
    Lingfeng Dai , Lu Chen, Zhikai Zhou , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  64. Text Adaptive Detection for Customizable Keyword Spotting
    Yu Xi , Tian Tan , Wangyou Zhang , Baochen Yang , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  65. Unsupervised Word-Level Prosody Tagging for Controllable Speech Synthesis
    Yiwei Guo , Chenpeng Du , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  66. The AISP-SJTU Simultaneous Translation System for IWSLT 2022
    Qinpei Zhu , Renshou Wu , Guangfeng Liu , Xinyu Zhu , Xingyu Chen , Yang Zhou , Qingliang Miao , Rui Wang , and Kai Yu
    In Proceedings of the 19th International Conference on Spoken Language Translation, IWSLT@ACL 2022, Dublin, Ireland (in-person and online), May 26-27, 2022 , Oct 2022
  67. TIE: Topological Information Enhanced Structural Reading Comprehension on Web Pages
    Zihan Zhao , Lu Chen, Ruisheng Cao , Hongshen Xu , Xingyu Chen , and Kai Yu
    In Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL 2022, Seattle, WA, United States, July 10-15, 2022 , Oct 2022
  68. UniDU: Towards A Unified Generative Dialogue Understanding Framework
    Zhi Chen , Lu Chen , Bei Chen , Libo Qin , Yuncong Liu , Su Zhu , Jian-Guang Lou , and Kai Yu
    In Proceedings of the 23rd Annual Meeting of the Special Interest Group on Discourse and Dialogue, SIGDIAL 2022, Edinburgh, UK, 07-09 September 2022 , Oct 2022
  69. The AISP-SJTU Translation System for WMT 2022
    Guangfeng Liu , Qinpei Zhu , Xingyu Chen , Renjie Feng , Jianxin Ren , Renshou Wu , Qingliang Miao , Rui Wang , and Kai Yu
    In Proceedings of the Seventh Conference on Machine Translation, WMT 2022, Abu Dhabi, United Arab Emirates (Hybrid), December 7-8, 2022 , Oct 2022

2021

  1. Modified Magnitude-Phase Spectrum Information for Spoofing Detection
    Jichen Yang , Hongji Wang , Rohan Kumar Das , and Yanmin Qian
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
  2. Audio-Visual Deep Neural Network for Robust Person Verification
    Yanmin Qian , Zhengyang Chen , and Shuai Wang
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
  3. Dual-Path Modeling for Long Recording Speech Separation in Meetings
    Chenda Li , Zhuo Chen , Yi Luo , Cong Han , Tianyan Zhou , Keisuke Kinoshita , Marc Delcroix , Shinji Watanabe , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  4. Self-Supervised Learning Based Domain Adaptation for Robust Speaker Verification
    Zhengyang Chen , Shuai Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  5. SynAug: Synthesis-Based Data Augmentation for Text-Dependent Speaker Verification
    Chenpeng Du , Bing Han , Shuai Wang , Yanmin Qian , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  6. Unit Selection Synthesis Based Data Augmentation for Fixed Phrase Speaker Verification
    Houjun Huang , Xu Xiang , Fei Zhao , Shuai Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  7. AISpeech-SJTU Accent Identification System for the Accented English Speech Recognition Challenge
    Houjun Huang , Xu Xiang , Yexin Yang , Rao Ma , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  8. AISpeech-SJTU ASR System for the Accented English Speech Recognition Challenge
    Tian Tan , Yizhou Lu , Rao Ma , Sen Zhu , Jiaqi Guo , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  9. Towards Data Selection on TTS Data for Children’s Speech Recognition
    Wei Wang , Zhikai Zhou , Yizhou Lu , Hongji Wang , Chenpeng Du , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  10. End-to-End Dereverberation, Beamforming, and Speech Recognition with Improved Numerical Stability and Advanced Frontend
    Wangyou Zhang , Christoph Böddeker , Shinji Watanabe , Tomohiro Nakatani , Marc Delcroix , Keisuke Kinoshita , Tsubasa Ochiai , Naoyuki Kamo , Reinhold Haeb-Umbach , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  11. The Accented English Speech Recognition Challenge 2020: Open Datasets, Tracks, Baselines, Results and Methods
    Xian Shi , Fan Yu , Yizhou Lu , Yuhao Liang , Qiangze Feng , Daliang Wang , Yanmin Qian , and Lei Xie
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  12. Convolutive Transfer Function Invariant SDR Training Criteria for Multi-Channel Reverberant Speech Separation
    Christoph Böddeker , Wangyou Zhang , Tomohiro Nakatani , Keisuke Kinoshita , Tsubasa Ochiai , Marc Delcroix , Naoyuki Kamo , Yanmin Qian , and Reinhold Haeb-Umbach
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  13. Layer-Wise Fast Adaptation for End-to-End Multi-Accent Speech Recognition
    Xun Gong , Yizhou Lu , Zhikai Zhou , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  14. Knowledge Distillation from Multi-Modality to Single-Modality for Person Verification
    Leying Zhang , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  15. Basis-MelGAN: Efficient Neural Vocoder Based on Audio Decomposition
    Zhengxi Liu , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  16. The SJTU System for Short-Duration Speaker Verification Challenge 2021
    Bing Han , Zhengyang Chen , Zhikai Zhou , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  17. Audio-Visual Multi-Talker Speech Recognition in a Cocktail Party
    Yifei Wu , Chenda Li , Song Yang , Zhongqin Wu , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  18. Speaker Embedding Augmentation with Noise Distribution Matching
    Xun Gong , Zhengyang Chen , Yexin Yang , Shuai Wang , Lan Wang , and Yanmin Qian
    In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
  19. Revisiting the Statistics Pooling Layer in Deep Speaker Embedding Learning
    Shuai Wang , Yexin Yang , Yanmin Qian , and Kai Yu
    In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
  20. Data Augmentation for end-to-end Code-Switching Speech Recognition
    Chenpeng Du , Hao Li , Yizhou Lu , Lan Wang , and Yanmin Qian
    In IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021 , Oct 2021
  21. Dual-Path RNN for Long Recording Speech Separation
    Chenda Li , Yi Luo , Cong Han , Jinyu Li , Takuya Yoshioka , Tianyan Zhou , Marc Delcroix , Keisuke Kinoshita , Christoph Böddeker , Yanmin Qian , Shinji Watanabe , and Zhuo Chen
    In IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021 , Oct 2021
  22. Closing the Gap Between Time-Domain Multi-Channel Speech Enhancement on Real and Simulation Conditions
    Wangyou Zhang , Jing Shi , Chenda Li , Shinji Watanabe , and Yanmin Qian
    In IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2021, New Paltz, NY, USA, October 17-20, 2021 , Oct 2021
  23. Towards Duration Robust Weakly Supervised Sound Event Detection
    Heinrich Dinkel , Mengyue Wu, and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
  24. Voice Activity Detection in the Wild: A Data-Driven Approach Using Teacher-Student Training
    Heinrich Dinkel , Shuai Wang , Xuenan Xu , Mengyue Wu, and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
  25. Building Interpretable Interaction Trees for Deep NLP Models
    Die Zhang , Hao Zhang , Huilin Zhou , Xiaoyi Bao , Da Huo , Ruizhao Chen , Xu Cheng , Mengyue Wu, and Quanshi Zhang
    In Thirty-Fifth AAAI Conference on Artificial Intelligence, AAAI 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, IAAI 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, EAAI 2021, Virtual Event, February 2-9, 2021 , Oct 2021
  26. Decoupled Dialogue Modeling and Semantic Parsing for Multi-Turn Text-to-SQL
    Zhi Chen , Lu Chen, Hanqi Li , Ruisheng Cao , Da Ma , Mengyue Wu, and Kai Yu
    In Findings of the Association for Computational Linguistics: ACL/IJCNLP 2021, Online Event, August 1-6, 2021 , Oct 2021
  27. Enriching Ontology with Temporal Commonsense for Low-Resource Audio Tagging
    Zhiling Zhang , Zelin Zhou , Haifeng Tang , Guangwei Li , Mengyue Wu , and Kenny Q. Zhu
    In CIKM ’21: The 30th ACM International Conference on Information and Knowledge Management, Virtual Event, Queensland, Australia, November 1 - 5, 2021 , Oct 2021
  28. Text-to-Audio Grounding: Building Correspondence Between Captions and Sound Events
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  29. Investigating Local and Global Information for Automated Audio Captioning with Transfer Learning
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, Zeyu Xie , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  30. A Lightweight Framework for Online Voice Activity Detection in the Wild
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  31. Audio Caption in a Car Setting with a Sentence-Level Loss
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
  32. DEPA: Self-Supervised Audio Embedding for Depression Detection
    Pingyue Zhang , Mengyue Wu, Heinrich Dinkel , and Kai Yu
    In MM ’21: ACM Multimedia Conference, Virtual Event, China, October 20 - 24, 2021 , Oct 2021
  33. LET: Linguistic Knowledge Enhanced Graph Transformer for Chinese Short Text Matching
    Boer Lyu , Lu Chen , Su Zhu , and Kai Yu
    In Thirty-Fifth AAAI Conference on Artificial Intelligence, AAAI 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, IAAI 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, EAAI 2021, Virtual Event, February 2-9, 2021 , Oct 2021
  34. LGESQL: Line Graph Enhanced Text-to-SQL Model with Mixed Local and Non-Local Relations
    Ruisheng Cao , Lu Chen , Zhi Chen , Yanbin Zhao , Su Zhu , and Kai Yu
    In Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing, ACL/IJCNLP 2021, (Volume 1: Long Papers), Virtual Event, August 1-6, 2021 , Oct 2021
  35. WebSRC: A Dataset for Web-Based Structural Reading Comprehension
    Xingyu Chen , Zihan Zhao , Lu Chen, Jiabao Ji , Danyang Zhang , Ao Luo , Yuxuan Xiong , and Kai Yu
    In Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, EMNLP 2021, Virtual Event / Punta Cana, Dominican Republic, 7-11 November, 2021 , Oct 2021
  36. Glyph Enhanced Chinese Character Pre-Training for Lexical Sememe Prediction
    Boer Lyu , Lu Chen, and Kai Yu
    In Findings of the Association for Computational Linguistics: EMNLP 2021, Virtual Event / Punta Cana, Dominican Republic, 16-20 November, 2021 , Oct 2021
  37. Class-Based Neural Network Language Model for Second-Pass Rescoring in ASR
    Lingfeng Dai , Qi Liu , and Kai Yu
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  38. Rich Prosody Diversity Modelling with Phone-Level Mixture Density Network
    Chenpeng Du , and Kai Yu
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  39. ShadowGNN: Graph Projection Neural Network for Text-to-SQL Parser
    Zhi Chen , Lu Chen, Yanbin Zhao , Ruisheng Cao , Zihan Xu , Su Zhu , and Kai Yu
    In Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2021, Online, June 6-11, 2021 , Oct 2021
  40. Few-Shot NLU with Vector Projection Distance and Abstract Triangular CRF
    Su Zhu , Lu Chen, Ruisheng Cao , Zhi Chen , Qingliang Miao , and Kai Yu
    In Natural Language Processing and Chinese Computing - 10th CCF International Conference, NLPCC 2021, Qingdao, China, October 13-17, 2021, Proceedings, Part I , Oct 2021
  41. Relation-Aware Multi-hop Reasoning for Visual Dialog
    Yao Zhao , Lu Chen, and Kai Yu
    In Natural Language Processing and Chinese Computing - 10th CCF International Conference, NLPCC 2021, Qingdao, China, October 13-17, 2021, Proceedings, Part I , Oct 2021
  42. Mixture Density Network for Phone-Level Prosody Modelling in Speech Synthesis
    Chenpeng Du , and Kai Yu
    CoRR, Oct 2021
  43. Diverse and Controllable Speech Synthesis with GMM-Based Phone-Level Prosody Modelling
    Chenpeng Du , and Kai Yu
    CoRR, Oct 2021

2020

  1. Improving End-to-End Single-Channel Multi-Talker Speech Recognition
    Wangyou Zhang , Xuankai Chang , Yanmin Qian , and Shinji Watanabe
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  2. Data Augmentation Using Deep Generative Models for Embedding Based Speaker Recognition
    Shuai Wang , Yexin Yang , Zhanghao Wu , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  3. End-To-End Multi-Speaker Speech Recognition With Transformer
    Xuankai Chang , Wangyou Zhang , Yanmin Qian , Jonathan Le Roux , and Shinji Watanabe
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  4. Text Adaptation for Speaker Verification with Speaker-Text Factorized Embeddings
    Yexin Yang , Shuai Wang , Xun Gong , Yanmin Qian , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  5. Channel Invariant Speaker Embedding Learning with Joint Multi-Task and Adversarial Training
    Zhengyang Chen , Shuai Wang , Yanmin Qian , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  6. Deep Audio-Visual Speech Separation with Attention Mechanism
    Chenda Li , and Yanmin Qian
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  7. Learning Contextual Language Embeddings for Monaural Multi-Talker Speech Recognition
    Wangyou Zhang , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  8. End-to-End Far-Field Speech Recognition with Unified Dereverberation and Beamforming
    Wangyou Zhang , Aswin Shanmugam Subramanian , Xuankai Chang , Shinji Watanabe , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  9. Dual-Adversarial Domain Adaptation for Generalized Replay Attack Detection
    Hongji Wang , Heinrich Dinkel , Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  10. Listen, Watch and Understand at the Cocktail Party: Audio-Visual-Contextual Speech Separation
    Chenda Li , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  11. Multi-Modality Matters: A Performance Leap on VoxCeleb
    Zhengyang Chen , Shuai Wang , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  12. Adversarial Domain Adaptation for Speaker Verification Using Partially Shared Network
    Zhengyang Chen , Shuai Wang , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  13. Bi-Encoder Transformer Network for Mandarin-English Code-Switching Speech Recognition Using Mixture of Experts
    Yizhou Lu , Mingkun Huang , Hao Li , Jiaqi Guo , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  14. End-to-End Speaker-Dependent Voice Activity Detection
    Yefei Chen , Shuai Wang , Yanmin Qian , and Kai Yu
    CoRR, Oct 2020
  15. A CRNN-GRU Based Reinforcement Learning Approach to Audio Captioning
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In Proceedings of the 5th Workshop on Detection and Classification of Acoustic Scenes and Events 2020 (DCASE 2020), Tokyo, Japan (full virtual), November 2-4, 2020 , Oct 2020
  16. Multiple Sound Sources Localization from Coarse to Fine
    Rui Qian , Di Hu , Heinrich Dinkel , Mengyue Wu, Ning Xu , and Weiyao Lin
    In Computer Vision - ECCV 2020 - 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part XX , Oct 2020
  17. Voice Activity Detection in the Wild via Weakly Supervised Sound Event Detection
    Yefei Chen , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  18. GPVAD: Towards noise robust voice activity detection via weakly supervised sound event detection
    Heinrich Dinkel , Yefei Chen , Mengyue Wu, and Kai Yu
    CoRR, Oct 2020
  19. Interpreting Hierarchical Linguistic Interactions in DNNs
    Die Zhang , Huilin Zhou , Xiaoyi Bao , Da Huo , Ruizhao Chen , Xu Cheng , Hao Zhang , Mengyue Wu, and Quanshi Zhang
    CoRR, Oct 2020
  20. Towards a new generation of artificial intelligence in China
    Fei Wu , Cewu Lu , Mingjie Zhu , Hao Chen , Jun Zhu , Kai Yu, Lei Li , Ming Li , Qianfeng Chen , Xi Li , Xudong Cao , Zhongyuan Wang , Zhengjun Zha , Yueting Zhuang , and Yunhe Pan
    Nat. Mach. Intell., Oct 2020
  21. Prior Knowledge Driven Label Embedding for Slot Filling in Natural Language Understanding
    Su Zhu , Zijian Zhao , Rao Ma , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  22. Dual Learning for Semi-Supervised Natural Language Understanding
    Su Zhu , Ruisheng Cao , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  23. Modular End-to-End Automatic Speech Recognition Framework for Acoustic-to-Word Model
    Qi Liu , Zhehuai Chen , Hao Li , Mingkun Huang , Yizhou Lu , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  24. Distributed Structured Actor-Critic Reinforcement Learning for Universal Dialogue Management
    Zhi Chen , Lu Chen, Xiaoyuan Liu , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  25. Neural Network Language Model Compression With Product Quantization and Soft Binarization
    Kai Yu, Rao Ma , Kaiyu Shi , and Qi Liu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  26. Schema-Guided Multi-Domain Dialogue State Tracking with Graph Attention Neural Networks
    Lu Chen, Boer Lv , Chi Wang , Su Zhu , Bowen Tan , and Kai Yu
    In The Thirty-Fourth AAAI Conference on Artificial Intelligence, AAAI 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, IAAI 2020, The Tenth AAAI Symposium on Educational Advances in Artificial Intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 , Oct 2020
  27. Semi-Supervised Text Simplification with Back-Translation and Asymmetric Denoising Autoencoders
    Yanbin Zhao , Lu Chen , Zhi Chen , and Kai Yu
    In The Thirty-Fourth AAAI Conference on Artificial Intelligence, AAAI 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, IAAI 2020, The Tenth AAAI Symposium on Educational Advances in Artificial Intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 , Oct 2020
  28. Line Graph Enhanced AMR-to-Text Generation with Mix-Order Graph Attention Networks
    Yanbin Zhao , Lu Chen , Zhi Chen , Ruisheng Cao , Su Zhu , and Kai Yu
    In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
  29. Neural Graph Matching Networks for Chinese Short Text Matching
    Lu Chen, Yanbin Zhao , Boer Lyu , Lesheng Jin , Zhi Chen , Su Zhu , and Kai Yu
    In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
  30. Unsupervised Dual Paraphrasing for Two-stage Semantic Parsing
    Ruisheng Cao , Su Zhu , Chenyu Yang , Chen Liu , Rao Ma , Yanbin Zhao , Lu Chen, and Kai Yu
    In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
  31. Efficient Context and Schema Fusion Networks for Multi-Domain Dialogue State Tracking
    Su Zhu , Jieyu Li , Lu Chen, and Kai Yu
    In Findings of the Association for Computational Linguistics: EMNLP 2020, Online Event, 16-20 November 2020 , Oct 2020
  32. Duration Robust Weakly Supervised Sound Event Detection
    Heinrich Dinkel , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  33. Investigation of SpecAugment for Deep Speaker Embedding Learning
    Shuai Wang , Johan Rohdin , Oldrich Plchot , Lukás Burget , Kai Yu, and Jan Cernocký
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  34. Speaker Augmentation for Low Resource Speech Recognition
    Chenpeng Du , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  35. Neural Lattice Search for Speech Recognition
    Rao Ma , Hao Li , Qi Liu , Lu Chen, and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  36. A Hierarchical Tracker for Multi-Domain Dialogue State Tracking
    Jieyu Li , Su Zhu , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  37. Addressing the Polysemy Problem in Language Modeling with Attentional Multi-Sense Embeddings
    Rao Ma , Lesheng Jin , Qi Liu , Lu Chen, and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  38. CODA: Improving Resource Utilization by Slimming and Co-locating DNN and CPU Jobs
    Han Zhao , Weihao Cui , Quan Chen , Jingwen Leng , Kai Yu, Deze Zeng , Chao Li , and Minyi Guo
    In 40th IEEE International Conference on Distributed Computing Systems, ICDCS 2020, Singapore, November 29 - December 1, 2020 , Oct 2020
  39. Jointly Encoding Word Confusion Network and Dialogue Context with BERT for Spoken Language Understanding
    Chen Liu , Su Zhu , Zijian Zhao , Ruisheng Cao , Lu Chen, and Kai Yu
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  40. Memory Attention Neural Network for Multi-domain Dialogue State Tracking
    Zihan Xu , Zhi Chen , Lu Chen , Su Zhu , and Kai Yu
    In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
  41. Robust Spoken Language Understanding with RL-Based Value Error Recovery
    Chen Liu , Su Zhu , Lu Chen, and Kai Yu
    In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
  42. An Investigation on Different Underlying Quantization Schemes for Pre-trained Language Models
    Zihan Zhao , Yuncong Liu , Lu Chen, Qi Liu , Rao Ma , and Kai Yu
    In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
  43. An Investigation on Deep Learning with Beta Stabilizer
    Qi Liu , Tian Tan , and Kai Yu
    CoRR, Oct 2020
  44. Vector Projection Network for Few-shot Slot Tagging in Natural Language Understanding
    Su Zhu , Ruisheng Cao , Lu Chen, and Kai Yu
    CoRR, Oct 2020
  45. Deep Reinforcement Learning for On-line Dialogue State Tracking
    Zhi Chen , Lu Chen, Xiang Zhou , and Kai Yu
    CoRR, Oct 2020
  46. Structured Hierarchical Dialogue Policy with Graph Neural Networks
    Zhi Chen , Xiaoyuan Liu , Lu Chen, and Kai Yu
    CoRR, Oct 2020
  47. Dual Learning for Dialogue State Tracking
    Zhi Chen , Lu Chen, Yanbin Zhao , Su Zhu , and Kai Yu
    CoRR, Oct 2020
  48. CREDIT: Coarse-to-Fine Sequence Generation for Dialogue State Tracking
    Zhi Chen , Lu Chen, Zihan Xu , Yanbin Zhao , Su Zhu , and Kai Yu
    CoRR, Oct 2020

2019

  1. Erratum to: Past review, current progress, and challenges ahead on the cocktail party problem
    Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
    Frontiers Inf. Technol. Electron. Eng., Oct 2019
  2. Binary neural networks for speech recognition
    Yanmin Qian , and Xu Xiang
    Frontiers Inf. Technol. Electron. Eng., Oct 2019
  3. Data augmentation using generative adversarial networks for robust speech recognition
    Yanmin Qian , Hu Hu , and Tian Tan
    Speech Commun., Oct 2019
  4. Discriminative Neural Embedding Learning for Short-Duration Text-Independent Speaker Verification
    Shuai Wang , Zili Huang , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2019
  5. Margin Matters: Towards More Discriminative Deep Neural Network Embeddings for Speaker Recognition
    Xu Xiang , Shuai Wang , Houjun Huang , Yanmin Qian , and Kai Yu
    In 2019 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2019, Lanzhou, China, November 18-21, 2019 , Oct 2019
  6. GANs for Children: A Generative Data Augmentation Strategy for Children Speech Recognition
    Peiyao Sheng , Zhuolin Yang , and Yanmin Qian
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  7. MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition
    Xuankai Chang , Wangyou Zhang , Yanmin Qian , Jonathan Le Roux , and Shinji Watanabe
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  8. Exploring Model Units and Training Strategies for End-to-End Speech Recognition
    Mingkun Huang , Yizhou Lu , Lan Wang , Yanmin Qian , and Kai Yu
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  9. End-to-End Overlapped Speech Detection and Speaker Counting with Raw Waveform
    Wangyou Zhang , Man Sun , Lan Wang , and Yanmin Qian
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  10. Knowledge Distillation for Small Foot-print Deep Speaker Embedding
    Shuai Wang , Yexin Yang , Tianzhe Wang , Yanmin Qian , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
  11. End-to-end Monaural Multi-speaker ASR System without Pretraining
    Xuankai Chang , Yanmin Qian , Kai Yu, and Shinji Watanabe
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
  12. The SJTU Robust Anti-Spoofing System for the ASVspoof 2019 Challenge
    Yexin Yang , Hongji Wang , Heinrich Dinkel , Zhengyang Chen , Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  13. On the Usage of Phonetic Information for Text-Independent Speaker Embedding Extraction
    Shuai Wang , Johan Rohdin , Lukás Burget , Oldrich Plchot , Yanmin Qian , Kai Yu, and Jan Cernocký
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  14. Data Augmentation Using Variational Autoencoder for Embedding Based Speaker Verification
    Zhanghao Wu , Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  15. Joint Decoding of CTC Based Systems for Speech Recognition
    Jiaqi Guo , Yongbin You , Yanmin Qian , and Kai Yu
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  16. Knowledge Distillation for End-to-End Monaural Multi-Talker ASR System
    Wangyou Zhang , Xuankai Chang , and Yanmin Qian
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  17. Robust DOA Estimation Based on Convolutional Neural Network and Time-Frequency Masking
    Wangyou Zhang , Ying Zhou , and Yanmin Qian
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  18. Cross-Domain Replay Spoofing Attack Detection Using Domain Adversarial Training
    Hongji Wang , Heinrich Dinkel , Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  19. Prosody Usage Optimization for Children Speech Recognition with Zero Resource Children Speech
    Chenda Li , and Yanmin Qian
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  20. Audio Caption: Listen and Tell
    Mengyue Wu, Heinrich Dinkel , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
  21. Text-based Depression Detection: What Triggers An Alert
    Heinrich Dinkel , Mengyue Wu, and Kai Yu
    CoRR, Oct 2019
  22. What does a Car-ssette tape tell?
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    CoRR, Oct 2019
  23. AgentGraph: Toward Universal Dialogue Management With Structured Deep Reinforcement Learning
    Lu Chen , Zhi Chen , Bowen Tan , Sishan Long , Milica Gasic , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2019
  24. Semantic Parsing with Dual Learning
    Ruisheng Cao , Su Zhu , Chen Liu , Jieyu Li , and Kai Yu
    In Proceedings of the 57th Conference of the Association for Computational Linguistics, ACL 2019, Florence, Italy, July 28 - August 2, 2019, Volume 1: Long Papers , Oct 2019
  25. Highly Efficient Neural Network Language Model Compression Using Soft Binarization Training
    Rao Ma , Qi Liu , and Kai Yu
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  26. Data Augmentation with Atomic Templates for Spoken Language Understanding
    Zijian Zhao , Su Zhu , and Kai Yu
    In Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing, EMNLP-IJCNLP 2019, Hong Kong, China, November 3-7, 2019 , Oct 2019
  27. A Hierarchical Decoding Model for Spoken Language Understanding from Unaligned Data
    Zijian Zhao , Su Zhu , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
  28. CATSLU: The 1st Chinese Audio-Textual Spoken Language Understanding Challenge
    Su Zhu , Zijian Zhao , Tiejun Zhao , Chengqing Zong , and Kai Yu
    In International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019 , Oct 2019
  29. Robust Spoken Language Understanding with Acoustic and Domain Knowledge
    Hao Li , Chen Liu , Su Zhu , and Kai Yu
    In International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019 , Oct 2019
  30. Cross Aggregation of Multi-head Attention for Neural Machine Translation
    Juncheng Cao , Hai Zhao , and Kai Yu
    In Natural Language Processing and Chinese Computing - 8th CCF International Conference, NLPCC 2019, Dunhuang, China, October 9-14, 2019, Proceedings, Part I , Oct 2019
  31. International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019
    Oct 2019

2018

  1. Past review, current progress, and challenges ahead on the cocktail party problem
    Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
    Frontiers Inf. Technol. Electron. Eng., Oct 2018
  2. Erratum to: Past review, current progress, and challenges ahead on the cocktail party problem
    Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
    Frontiers Inf. Technol. Electron. Eng., Oct 2018
  3. Sequence discriminative training for deep learning based acoustic keyword spotting
    Zhehuai Chen , Yanmin Qian , and Kai Yu
    Speech Commun., Oct 2018
  4. Single-channel multi-talker speech recognition with permutation invariant training
    Yanmin Qian , Xuankai Chang , and Dong Yu
    Speech Commun., Oct 2018
  5. Adaptive Very Deep Convolutional Residual Network for Noise Robust Speech Recognition
    Tian Tan , Yanmin Qian , Hu Hu , Ying Zhou , Wen Ding , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
  6. Investigating Raw Wave Deep Neural Networks for End-to-End Speaker Spoofing Detection
    Heinrich Dinkel , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
  7. Robust Mask Estimation By Integrating Neural Network-Based and Clustering-Based Approaches for Adaptive Acoustic Beamforming
    Ying Zhou , and Yanmin Qian
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  8. Knowledge Transfer in Permutation Invariant Training for Single-Channel Multi-Talker Speech Recognition
    Tian Tan , Yanmin Qian , and Dong Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  9. Joint I-Vector with End-to-End System for Short Duration Text-Independent Speaker Verification
    Zili Huang , Shuai Wang , and Yanmin Qian
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  10. Generative Adversarial Networks Based Data Augmentation for Noise Robust Speech Recognition
    Hu Hu , Tian Tan , and Yanmin Qian
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  11. Focal KL-Divergence Based Dilated Convolutional Neural Networks for Co-Channel Speaker Identification
    Shuai Wang , Yanmin Qian , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  12. Noise Robust Speech Recognition on Aurora4 by Humans and Machines
    Yanmin Qian , Tian Tan , Hu Hu , and Qi Liu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  13. Fast Adaptation on Deep Mixture Generative Network Based Acoustic Modeling
    Wen Ding , Tian Tan , and Yanmin Qian
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  14. Adaptive Permutation Invariant Training with Auxiliary Information for Monaural Multi-Talker Speech Recognition
    Xuankai Chang , Yanmin Qian , and Dong Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  15. Permutation Invariant Training of Generative Adversarial Network for Monaural Speech Separation
    Lianwu Chen , Meng Yu , Yanmin Qian , Dan Su , and Dong Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  16. Deep Extractor Network for Target Speaker Recovery from Single Channel Speech Mixtures
    Jun Wang , Jie Chen , Dan Su , Lianwu Chen , Meng Yu , Yanmin Qian , and Dong Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  17. Monaural Multi-Talker Speech Recognition with Attention Mechanism and Gated Convolutional Networks
    Xuankai Chang , Yanmin Qian , and Dong Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  18. Knowledge Distillation for Sequence Model
    Mingkun Huang , Yongbin You , Zhehuai Chen , Yanmin Qian , and Kai Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  19. Covariance Based Deep Feature for Text-Dependent Speaker Verification
    Shuai Wang , Heinrich Dinkel , Yanmin Qian , and Kai Yu
    In Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers , Oct 2018
  20. Data Augmentation using Conditional Generative Adversarial Networks for Robust Speech Recognition
    Peiyao Sheng , Zhuolin Yang , Hu Hu , Tian Tan , and Yanmin Qian
    In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
  21. Deep Discriminant Analysis for i-vector Based Robust Speaker Recognition
    Shuai Wang , Zili Huang , Yanmin Qian , and Kai Yu
    In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
  22. Generative Adversarial Networks based X-vector Augmentation for Robust Probabilistic Linear Discriminant Analysis in Speaker Verification
    Yexin Yang , Shuai Wang , Man Sun , Yanmin Qian , and Kai Yu
    In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
  23. Rich Short Text Conversation Using Semantic-Key-Controlled Sequence Generation
    Kai Yu, Zijian Zhao , Xueyang Wu , Hongtao Lin , and Xuan Liu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
  24. Structured Dialogue Policy with Graph Neural Networks
    Lu Chen, Bowen Tan , Sishan Long , and Kai Yu
    In Proceedings of the 27th International Conference on Computational Linguistics, COLING 2018, Santa Fe, New Mexico, USA, August 20-26, 2018 , Oct 2018
  25. Towards Universal Dialogue State Tracking
    Liliang Ren , Kaige Xie , Lu Chen, and Kai Yu
    In Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, Brussels, Belgium, October 31 - November 4, 2018 , Oct 2018
  26. On Modular Training of Neural Acoustics-to-Word Model for LVCSR
    Zhehuai Chen , Qi Liu , Hao Li , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  27. Semi-Supervised Training Using Adversarial Multi-Task Learning for Spoken Language Understanding
    Ouyu Lan , Su Zhu , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  28. Policy Adaptation for Deep Reinforcement Learning-Based Dialogue Management
    Lu Chen, Cheng Chang , Zhi Chen , Bowen Tan , Milica Gasic , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  29. Robust Spoken Language Understanding with Unsupervised ASR-Error Adaptation
    Su Zhu , Ouyu Lan , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  30. MLN: Moment localization Network and Samples Selection for Moment Retrieval
    Bo Huang , Ya Zhang , and Kai Yu
    In Proceedings of the 2nd International Conference on Video and Image Processing, ICVIP 2018, Hong Kong, China, December 29-31, 2018 , Oct 2018
  31. Angular Softmax for Short-Duration Text-independent Speaker Verification
    Zili Huang , Shuai Wang , and Kai Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  32. Joint Spoken Language Understanding and Domain Adaptive Language Modeling
    Huifeng Zhang , Su Zhu , Shuai Fan , and Kai Yu
    In Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers , Oct 2018
  33. Binarized LSTM Language Model
    Xuan Liu , Di Cao , and Kai Yu
    In Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2018, New Orleans, Louisiana, USA, June 1-6, 2018, Volume 1 (Long Papers) , Oct 2018
  34. Cost-Sensitive Active Learning for Dialogue State Tracking
    Kaige Xie , Cheng Chang , Liliang Ren , Lu Chen, and Kai Yu
    In Proceedings of the 19th Annual SIGdial Meeting on Discourse and Dialogue, Melbourne, Australia, July 12-14, 2018 , Oct 2018
  35. Concept Transfer Learning for Adaptive Language Understanding
    Su Zhu , and Kai Yu
    In Proceedings of the 19th Annual SIGdial Meeting on Discourse and Dialogue, Melbourne, Australia, July 12-14, 2018 , Oct 2018
  36. Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers
    Oct 2018

2017

  1. Phone Synchronous Speech Recognition With CTC Lattices
    Zhehuai Chen , Yimeng Zhuang , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2017
  2. Deep Feature Engineering for Noise Robust Spoofing Detection
    Yanmin Qian , Nanxin Chen , Heinrich Dinkel , and Zhizheng Wu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2017
  3. Integrating online i-vector into GMM-UBM for text-dependent speaker verification
    Xiaowei Jiang , Shuai Wang , Xu Xiang , and Yanmin Qian
    In 2017 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2017, Kuala Lumpur, Malaysia, December 12-15, 2017 , Oct 2017
  4. Future vector enhanced LSTM language model for LVCSR
    Qi Liu , Yanmin Qian , and Kai Yu
    In 2017 IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2017, Okinawa, Japan, December 16-20, 2017 , Oct 2017
  5. Multi-view LSTM Language Model with Word-Synchronized Auxiliary Feature for LVCSR
    Yue Wu , Tianxing He , Zhehuai Chen , Yanmin Qian , and Kai Yu
    In Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data - 16th China National Conference, CCL 2017, - and - 5th International Symposium, NLP-NABD 2017, Nanjing, China, October 13-15, 2017, Proceedings , Oct 2017
  6. End-to-end spoofing detection with raw waveform CLDNNs
    Heinrich Dinkel , Nanxin Chen , Yanmin Qian , and Kai Yu
    In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
  7. Small-footprint convolutional neural network for spoofing detection
    Heinrich Dinkel , Yanmin Qian , and Kai Yu
    In 2017 International Joint Conference on Neural Networks, IJCNN 2017, Anchorage, AK, USA, May 14-19, 2017 , Oct 2017
  8. Binary Deep Neural Networks for Speech Recognition
    Xu Xiang , Yanmin Qian , and Kai Yu
    In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
  9. What Does the Speaker Embedding Encode?
    Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
  10. Recognizing Multi-Talker Speech with Permutation Invariant Training
    Dong Yu , Xuankai Chang , and Yanmin Qian
    In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
  11. A Unified Confidence Measure Framework Using Auxiliary Normalization Graph
    Zhehuai Chen , Yanmin Qian , and Kai Yu
    In Intelligence Science and Big Data Engineering - 7th International Conference, IScIDE 2017, Dalian, China, September 22-23, 2017, Proceedings , Oct 2017
  12. Adaptation of Deep Neural Network Acoustic Models for Robust Automatic Speech Recognition
    Khe Chai Sim , Yanmin Qian , Gautam Mantena , Lahiru Samarakoon , Souvik Kundu , and Tian Tan
    In New Era for Robust Speech Recognition, Exploiting Deep Learning , Oct 2017
  13. On-line Dialogue Policy Learning with Companion Teaching
    Lu Chen, Runzhe Yang , Cheng Chang , Zihao Ye , Xiang Zhou , and Kai Yu
    In Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics, EACL 2017, Valencia, Spain, April 3-7, 2017, Volume 2: Short Papers , Oct 2017
  14. Affordable On-line Dialogue Policy Learning
    Cheng Chang , Runzhe Yang , Lu Chen, Xiang Zhou , and Kai Yu
    In Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, EMNLP 2017, Copenhagen, Denmark, September 9-11, 2017 , Oct 2017
  15. Agent-Aware Dropout DQN for Safe and Efficient On-line Dialogue Policy Learning
    Lu Chen, Xiang Zhou , Cheng Chang , Runzhe Yang , and Kai Yu
    In Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, EMNLP 2017, Copenhagen, Denmark, September 9-11, 2017 , Oct 2017
  16. Confidence measures for CTC-based phone synchronous decoding
    Zhehuai Chen , Yimeng Zhuang , and Kai Yu
    In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
  17. Encoder-decoder with focus-mechanism for sequence labelling based spoken language understanding
    Su Zhu , and Kai Yu
    In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
  18. Discrete Duration Model for Speech Synthesis
    Bo Chen , Tianling Bian , and Kai Yu
    In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
  19. Deep Attentive Structured Language Model Based on LSTM
    Di Cao , and Kai Yu
    In Intelligence Science and Big Data Engineering - 7th International Conference, IScIDE 2017, Dalian, China, September 22-23, 2017, Proceedings , Oct 2017
  20. splab at the NTCIR-13 STC-2 Task
    Xuan Liu , Xueyang Wu , Ruinian Chen , Zijian Zhao , Hongtao Lin , and Kai Yu
    In The 13th NTCIR Conference, Evaluation of Information Access Technologies, National Center of Sciences, Tokyo, Japan, December 5-8, 2017 , Oct 2017

2016

  1. Deep features for automatic spoofing detection
    Yanmin Qian , Nanxin Chen , and Kai Yu
    Speech Commun., Oct 2016
  2. Cluster Adaptive Training for Deep Neural Network Based Acoustic Model
    Tian Tan , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
  3. Neural Network Based Multi-Factor Aware Joint Training for Robust Speech Recognition
    Yanmin Qian , Tian Tan , and Dong Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
  4. Very Deep Convolutional Neural Networks for Noise Robust Speech Recognition
    Yanmin Qian , Mengxiao Bi , Tian Tan , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
  5. Overview of BTAS 2016 speaker anti-spoofing competition
    Pavel Korshunov , Sébastien Marcel , Hannah Muckenhirn , André R. Gonçalves , A. G. Souza Mello , Ricardo Paranhos Velloso Violato , Flávio Olmos Simões , M. U. Neto , Marcus Assis Angeloni , José Augusto Stuchi , Heinrich Dinkel , Nanxin Chen , Yanmin Qian , Dipjyoti Paul , Goutam Saha , and Md. Sahidullah
    In 8th IEEE International Conference on Biometrics Theory, Applications and Systems, BTAS 2016, Niagara Falls, NY, USA, September 6-9, 2016 , Oct 2016
  6. Joint acoustic factor learning for robust deep neural network based automatic speech recognition
    Souvik Kundu , Gautam Mantena , Yanmin Qian , Tian Tan , Marc Delcroix , and Khe Chai Sim
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  7. Speaker-aware training of LSTM-RNNs for acoustic modelling
    Tian Tan , Yanmin Qian , Dong Yu , Souvik Kundu , Liang Lu , Khe Chai Sim , Xiong Xiao , and Yu Zhang
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  8. Improved DNN-based segmentation for multi-genre broadcast audio
    Linlin Wang , Chao Zhang , Philip C. Woodland , Mark J. F. Gales , Panagiota Karanasou , Pierre Lanchantin , Xunying Liu , and Yanmin Qian
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  9. An investigation into using parallel data for far-field speech recognition
    Yanmin Qian , Tian Tan , and Dong Yu
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  10. Integrated adaptation with multi-factor joint-learning for far-field speech recognition
    Yanmin Qian , Tian Tan , Dong Yu , and Yu Zhang
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  11. Unrestricted Vocabulary Keyword Spotting Using LSTM-CTC
    Yimeng Zhuang , Xuankai Chang , Yanmin Qian , and Kai Yu
    In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
  12. Multi-task joint-learning for robust voice activity detection
    Yimeng Zhuang , Sibo Tong , Maofan Yin , Yanmin Qian , and Kai Yu
    In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
  13. Very deep convolutional neural networks for robust speech recognition
    Yanmin Qian , and Philip C. Woodland
    In 2016 IEEE Spoken Language Technology Workshop, SLT 2016, San Diego, CA, USA, December 13-16, 2016 , Oct 2016
  14. Evolvable dialogue state tracking for statistical dialogue management
    Kai Yu, Lu Chen, Kai Sun , Qizhe Xie , and Su Zhu
    Frontiers Comput. Sci., Oct 2016
  15. Discriminatively trained joint speaker and environment representations for adaptation of deep neural network acoustic models
    Maofan Yin , Sunil Sivadas , Kai Yu, and Bin Ma
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  16. A comparative study of robustness of deep learning approaches for VAD
    Sibo Tong , Hao Gu , and Kai Yu
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  17. Phone Synchronous Decoding with CTC Lattice
    Zhehuai Chen , Wei Deng , Tao Xu , and Kai Yu
    In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
  18. Hybrid Dialogue State Tracking for Real World Human-to-Human Dialogues
    Kai Sun , Su Zhu , Lu Chen, Siqiu Yao , Xueyang Wu , and Kai Yu
    In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
  19. On training bi-directional neural network language model with noise contrastive estimation
    Tianxing He , Yu Zhang , Jasha Droppo , and Kai Yu
    In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
  20. Rich punctuations prediction using large-scale deep learning
    Xueyang Wu , Su Zhu , Yue Wu , and Kai Yu
    In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
  21. Directed automatic speech transcription error correction using bidirectional LSTM
    Da Zheng , Zhehuai Chen , Yue Wu , and Kai Yu
    In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
  22. The splab at the NTCIR-12 Short Text Conversation Task
    Ke Wu , Xuan Liu , and Kai Yu
    In Proceedings of the 12th NTCIR Conference on Evaluation of Information Access Technologies, National Center of Sciences, Tokyo, Japan, June 7-10, 2016 , Oct 2016

2015

  1. Deep feature for text-dependent speaker verification
    Yuan Liu , Yanmin Qian , Nanxin Chen , Tianfan Fu , Ya Zhang , and Kai Yu
    Speech Commun., Oct 2015
  2. Multi-task joint-learning of deep neural networks for robust speech recognition
    Yanmin Qian , Maofan Yin , Yongbin You , and Kai Yu
    In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
  3. Cambridge University transcription systems for the multi-genre broadcast challenge
    Philip C. Woodland , Xunying Liu , Yanmin Qian , Chao Zhang , Mark J. F. Gales , Penny Karanasou , Pierre Lanchantin , and Linlin Wang
    In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
  4. The development of the Cambridge University alignment systems for the multi-genre broadcast challenge
    Pierre Lanchantin , Mark J. F. Gales , Penny Karanasou , Xunying Liu , Yanmin Qian , Linlin Wang , Philip C. Woodland , and Chao Zhang
    In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
  5. Speaker diarisation and longitudinal linking in multi-genre broadcast data
    Penny Karanasou , Mark J. F. Gales , Pierre Lanchantin , Xunying Liu , Yanmin Qian , Linlin Wang , Philip C. Woodland , and Chao Zhang
    In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
  6. Local trajectory based speech enhancement for robust speech recognition with deep neural network
    Yongbin You , Yanmin Qian , and Kai Yu
    In IEEE China Summit and International Conference on Signal and Information Processing, ChinaSIP 2015, Chengdu, China, July 12-15, 2015 , Oct 2015
  7. An investigation on DNN-derived bottleneck features for GMM-HMM based robust speech recognition
    Yongbin You , Yanmin Qian , Tianxing He , and Kai Yu
    In IEEE China Summit and International Conference on Signal and Information Processing, ChinaSIP 2015, Chengdu, China, July 12-15, 2015 , Oct 2015
  8. Cluster adaptive training for deep neural network
    Tian Tan , Yanmin Qian , Maofan Yin , Yimeng Zhuang , and Kai Yu
    In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
  9. A novel static parameter calculation method for model compensation
    Suliang Bu , Yunxin Zhao , Yanmin Qian , and Kai Yu
    In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
  10. Recurrent neural network language model with structured word embeddings for speech recognition
    Tianxing He , Xu Xiang , Yanmin Qian , and Kai Yu
    In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
  11. Automatic model redundancy reduction for fast back-propagation for deep neural networks in speech recognition
    Yanmin Qian , Tianxing He , Wei Deng , and Kai Yu
    In 2015 International Joint Conference on Neural Networks, IJCNN 2015, Killarney, Ireland, July 12-17, 2015 , Oct 2015
  12. Multi-task learning for text-dependent speaker verification
    Nanxin Chen , Yanmin Qian , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  13. Robust deep feature for spoofing detection - the SJTU system for ASVspoof 2015 challenge
    Nanxin Chen , Yanmin Qian , Heinrich Dinkel , Bo Chen , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  14. Very deep convolutional neural networks for LVCSR
    Mengxiao Bi , Yanmin Qian , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  15. Paragraph vector based topic model for language model adaptation
    Wengong Jin , Tianxing He , Yanmin Qian , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  16. Constrained Markov Bayesian Polynomial for Efficient Dialogue State Tracking
    Kai Yu, Kai Sun , Lu Chen , and Su Zhu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2015
  17. An investigation of context clustering for statistical speech synthesis with deep neural network
    Bo Chen , Zhehuai Chen , Jiachen Xu , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  18. Recurrent Polynomial Network for Dialogue State Tracking with Mismatched Semantic Parsers
    Qizhe Xie , Kai Sun , Su Zhu , Lu Chen, and Kai Yu
    In Proceedings of the SIGDIAL 2015 Conference, The 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 2-4 September 2015, Prague, Czech Republic , Oct 2015
  19. Hyper-parameter Optimisation of Gaussian Process Reinforcement Learning for Statistical Dialogue Management
    Lu Chen, Pei-Hao Su , and Milica Gasic
    In Proceedings of the SIGDIAL 2015 Conference, The 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 2-4 September 2015, Prague, Czech Republic , Oct 2015

2014

  1. Stochastic data sweeping for fast DNN training
    Wei Deng , Yanmin Qian , Yuchen Fan , Tianfan Fu , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
  2. Reshaping deep neural network for fast decoding by node-pruning
    Tianxing He , Yuchen Fan , Yanmin Qian , Tian Tan , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
  3. Second order vector Taylor series based robust speech recognition
    Suliang Bu , Yanmin Qian , Khe Chai Sim , Yongbin You , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
  4. Speaker verification with deep features
    Yuan Liu , Tianfan Fu , Yuchen Fan , Yanmin Qian , and Kai Yu
    In 2014 International Joint Conference on Neural Networks, IJCNN 2014, Beijing, China, July 6-11, 2014 , Oct 2014
  5. Tandem deep features for text-dependent speaker verification
    Tianfan Fu , Yanmin Qian , Yuan Liu , and Kai Yu
    In INTERSPEECH 2014, 15th Annual Conference of the International Speech Communication Association, Singapore, September 14-18, 2014 , Oct 2014
  6. A novel dynamic parameters calculation approach for model compensation
    Suliang Bu , Yanmin Qian , and Kai Yu
    In INTERSPEECH 2014, 15th Annual Conference of the International Speech Communication Association, Singapore, September 14-18, 2014 , Oct 2014
  7. Acoustic emotion recognition using deep neural network
    Jianwei Niu , Yanmin Qian , and Kai Yu
    In The 9th International Symposium on Chinese Spoken Language Processing, Singapore, September 12-14, 2014 , Oct 2014
  8. The SJTU System for Dialog State Tracking Challenge 2
    Kai Sun , Lu Chen , Su Zhu , and Kai Yu
    In Proceedings of the SIGDIAL 2014 Conference, The 15th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 18-20 June 2014, Philadelphia, PA, USA , Oct 2014
  9. A generalized rule based tracker for dialogue state tracking
    Kai Sun , Lu Chen , Su Zhu , and Kai Yu
    In 2014 IEEE Spoken Language Technology Workshop, SLT 2014, South Lake Tahoe, NV, USA, December 7-10, 2014 , Oct 2014
  10. Semantic parser enhancement for dialogue domain extension with little data
    Su Zhu , Lu Chen, Kai Sun , Da Zheng , and Kai Yu
    In 2014 IEEE Spoken Language Technology Workshop, SLT 2014, South Lake Tahoe, NV, USA, December 7-10, 2014 , Oct 2014

2013

  1. Combination of data borrowing strategies for low-resource LVCSR
    Yanmin Qian , Kai Yu, and Jia Liu
    In 2013 IEEE Workshop on Automatic Speech Recognition and Understanding, Olomouc, Czech Republic, December 8-12, 2013 , Oct 2013
  2. MLP-HMM two-stage unsupervised training for low-resource languages on conversational telephone speech recognition
    Yanmin Qian , and Jia Liu
    In INTERSPEECH 2013, 14th Annual Conference of the International Speech Communication Association, Lyon, France, August 25-29, 2013 , Oct 2013
  3. A New Word Language Model Evaluation Metric for Character Based Languages
    Peilu Wang , Ruihua Sun , Hai Zhao , and Kai Yu
    In Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data - 12th China National Conference, CCL 2013 and First International Symposium, NLP-NABD 2013, Suzhou, China, October 10-12, 2013. Proceedings , Oct 2013

2012

  1. Introduction to the Issue on Advances in Spoken Dialogue Systems and Mobile Interface
    Jason D. Williams , Kai Yu, Brahim Chaib-draa , Oliver Lemon , Roberto Pieraccini , Olivier Pietquin , Pascal Poupart , and Steve J. Young
    IEEE J. Sel. Top. Signal Process., Oct 2012
  2. ICMI’12 grand challenge: haptic voice recognition
    Khe Chai Sim , Shengdong Zhao , Kai Yu, and Hank Liao
    In International Conference on Multimodal Interaction, ICMI ’12, Santa Monica, CA, USA, October 22-26, 2012 , Oct 2012
  3. Development of the 2012 SJTU HVR system
    Hainan Xu , Yuchen Fan , and Kai Yu
    In International Conference on Multimodal Interaction, ICMI ’12, Santa Monica, CA, USA, October 22-26, 2012 , Oct 2012
\ No newline at end of file + 📃Papers | X - LANCE

📃Papers

Publications are listed in reversed chronological order.

2024

  1. Advanced Long-Content Speech Recognition With Factorized Neural Transducer
    Xun Gong , Yu Wu , Jinyu Li , Shujie Liu , Rui Zhao , Xie Chen, and Yanmin Qian
    IEEE ACM Trans. Audio Speech Lang. Process., 2024
  2. EAT: Self-Supervised Pre-Training with Efficient Audio Transformer
    Wenxi Chen , Yuzhe Liang , Ziyang Ma , Zhisheng Zheng , and Xie Chen
    CoRR, 2024
  3. ELLA-V: Stable Neural Codec Language Modeling with Alignment-guided Sequence Reordering
    Yakun Song , Zhuo Chen , Xiaofei Wang , Ziyang Ma , and Xie Chen
    CoRR, 2024
  4. BAT: Learning to Reason about Spatial Sounds with Large Language Models
    Zhisheng Zheng , Puyuan Peng , Ziyang Ma , Xie Chen, Eunsol Choi , and David Harwath
    CoRR, 2024
  5. An Embarrassingly Simple Approach for LLM with Strong ASR Capacity
    Ziyang Ma , Guanrou Yang , Yifan Yang , Zhifu Gao , Jiaming Wang , Zhihao Du , Fan Yu , Qian Chen , Siqi Zheng , Shiliang Zhang , and Xie Chen
    CoRR, 2024
  6. Beyond the Status Quo: A Contemporary Survey of Advances and Challenges in Audio Captioning
    Xuenan Xu , Zeyu Xie , Mengyue Wu, and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., 2024
  7. Towards Weakly Supervised Text-to-Audio Grounding
    Xuenan Xu , Ziyang Ma , Mengyue Wu, and Kai Yu
    CoRR, 2024
  8. VALL-T: Decoder-Only Generative Transducer for Robust and Decoding-Controllable Text-to-Speech
    Chenpeng Du , Yiwei Guo , Hankun Wang , Yifan Yang , Zhikang Niu , Shuai Wang , Hui Zhang , Xie Chen, and Kai Yu
    CoRR, 2024
  9. ChemDFM: Dialogue Foundation Model for Chemistry
    Zihan Zhao , Da Ma , Lu Chen, Liangtai Sun , Zihao Li , Hongshen Xu , Zichen Zhu , Su Zhu , Shuai Fan , Guodong Shen , Xin Chen , and Kai Yu
    CoRR, 2024
  10. MULTI: Multimodal Understanding Leaderboard with Text and Images
    Zichen Zhu, Yang Xu , Lu Chen, Jingkai Yang , Yichuan Ma , Yiming Sun , Hailin Wen , Jiaqi Liu , Jinyu Cai , Yingzi Ma , Situo Zhang , Zihan Zhao , Liangtai Sun , and Kai Yu
    CoRR, 2024

2023

  1. A Unified Framework From Face Image Restoration to Data Augmentation Using Generative Prior
    Jiawei You , Ganyu Huang , Tianyuan Han , Haoze Yang , and Liping Shen
    IEEE Access, 2023
  2. Human Pose Estimation with Combined Feature Maps and Joint Embeddings
    Tianyuan Han , Ganyu Huang , Chunhui Li , and Liping Shen
    In Proceedings of the 2023 International Conference on Advances in Artificial Intelligence and Applications, AAIA 2023, Wuhan, China, November 18-20, 2023 , 2023
  3. Assessing and Enhancing LLMs: A Physics and History Dataset and One-More-Check Pipeline Method
    Chaofan He , Chunhui Li , Tianyuan Han , and Liping Shen
    In Neural Information Processing - 30th International Conference, ICONIP 2023, Changsha, China, November 20-23, 2023, Proceedings, Part XIII , 2023
  4. GAN Latent Space Manipulation Based Augmentation for Unbalanced Emotion Datasets
    Yuhan Xiong , Jiawei You , and Liping Shen
    In International Joint Conference on Neural Networks, IJCNN 2023, Gold Coast, Australia, June 18-23, 2023 , 2023
  5. LongFNT: Long-Form Speech Recognition with Factorized Neural Transducer
    Xun Gong , Yu Wu , Jinyu Li , Shujie Liu , Rui Zhao , Xie Chen, and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  6. Factorized AED: Factorized Attention-Based Encoder-Decoder for Text-Only Domain Adaptive ASR
    Xun Gong , Wei Wang , Hang Shao , Xie Chen, and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  7. Exploring Binary Classification Loss for Speaker Verification
    Bing Han , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  8. Improving Dino-Based Self-Supervised Speaker Verification with Progressive Cluster-Aware Training
    Bing Han , Wen Huang , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
  9. Robust Audio-Visual ASR with Unified Cross-Modal Attention
    Jiahong Li , Chenda Li , Yifei Wu , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  10. Target Sound Extraction with Variable Cross-Modality Clues
    Chenda Li , Yao Qian , Zhuo Chen , Dongmei Wang , Takuya Yoshioka , Shujie Liu , Yanmin Qian , and Michael Zeng
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  11. Predictive Skim: Contrastive Predictive Coding for Low-Latency Online Speech Separation
    Chenda Li , Yifei Wu , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  12. Multi-Speaker End-to-End Multi-Modal Speaker Diarization System for the MISP 2022 Challenge
    Tao Liu , Zhengyang Chen , Yanmin Qian , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  13. Joint Discriminator and Transfer Based Fast Domain Adaptation For End-To-End Speech Recognition
    Hang Shao , Tian Tan , Wei Wang , Xun Gong , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  14. Lowbit Neural Network Quantization for Speaker Verification
    Haoyu Wang , Bei Liu , Yifei Wu , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
  15. Wespeaker: A Research and Production Oriented Speaker Embedding Learning Toolkit
    Hongji Wang , Chengdong Liang , Shuai Wang , Zhengyang Chen , Binbin Zhang , Xu Xiang , Yanlei Deng , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  16. HuBERT-AGG: Aggregated Representation Distillation of Hidden-Unit Bert for Robust Speech Recognition
    Wei Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  17. Light-Weight Visualvoice: Neural Network Quantization On Audio Visual Speech Separation
    Yifei Wu , Chenda Li , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
  18. Code-Switching Text Generation and Injection in Mandarin-English ASR
    Haibin Yu , Yuxuan Hu , Yao Qian , Ma Jin , Linquan Liu , Shujie Liu , Yu Shi , Yanmin Qian , Edward Lin , and Michael Zeng
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  19. Adaptive Large Margin Fine-Tuning For Robust Speaker Verification
    Leying Zhang , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
  20. ComSL: A Composite Speech-Language Model for End-to-End Speech-to-Text Translation
    Chenyang Le , Yao Qian , Long Zhou , Shujie Liu , Yanmin Qian , Michael Zeng , and Xuedong Huang
    In Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023 , 2023
  21. Exploring the Integration of Speech Separation and Recognition with Self-Supervised Learning Representation
    Yoshiki Masuyama , Xuankai Chang , Wangyou Zhang , Samuele Cornell , Zhong-Qiu Wang , Nobutaka Ono , Yanmin Qian , and Shinji Watanabe
    In IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2023, New Paltz, NY, USA, October 22-25, 2023 , 2023
  22. Software Design and User Interface of ESPnet-SE++: Speech Enhancement for Robust Speech Processing (espnet-v.202310) (Version 1)
    Yen-Ju Lu , Xuankai Chang , Chenda Li , Wangyou Zhang , Samuele Cornell , Zhaoheng Ni , Yoshiki Masuyama , Brian Yan , Robin Scheibler , Zhong-Qiu Wang , Yu Tsao , Yanmin Qian , and Shinji Watanabe
    Oct 2023
    Accessed on YYYY-MM-DD.
  23. Self-Supervised Learning with Cluster-Aware-DINO for High-Performance Robust Speaker Verification
    Bing Han , Zhengyang Chen , and Yanmin Qian
    CoRR, Oct 2023
  24. Attention-based Encoder-Decoder Network for End-to-End Neural Speaker Diarization with Target Speaker Attractor
    Zhengyang Chen , Bing Han , Shuai Wang , and Yanmin Qian
    CoRR, Oct 2023
  25. Whisper-KDQ: A Lightweight Whisper via Guided Knowledge Distillation and Quantization for Efficient ASR
    Hang Shao , Wei Wang , Bei Liu , Xun Gong , Haoyu Wang , and Yanmin Qian
    CoRR, Oct 2023
  26. Weakly-Supervised Speech Pre-training: A Case Study on Target Speech Recognition
    Wangyou Zhang , and Yanmin Qian
    CoRR, Oct 2023
  27. Adapting Multi-Lingual ASR Models for Handling Multiple Talkers
    Chenda Li , Yao Qian , Zhuo Chen , Naoyuki Kanda , Dongmei Wang , Takuya Yoshioka , Yanmin Qian , and Michael Zeng
    CoRR, Oct 2023
  28. InstructME: An Instruction Guided Music Edit And Remix Framework with Latent Diffusion Models
    Bing Han , Junyu Dai , Xuchen Song , Weituo Hao , Xinyan He , Dong Guo , Jitong Chen , Yuxuan Wang , and Yanmin Qian
    CoRR, Oct 2023
  29. Attention-based Encoder-Decoder End-to-End Neural Diarization with Embedding Enhancer
    Zhengyang Chen , Bing Han , Shuai Wang , and Yanmin Qian
    CoRR, Oct 2023
  30. USED: Universal Speaker Extraction and Diarization
    Junyi Ao , Mehmet Sinan Yildirim , Meng Ge , Shuai Wang , Ruijie Tao , Yanmin Qian , Liqun Deng , Longshuai Xiao , and Haizhou Li
    CoRR, Oct 2023
  31. Leveraging In-the-Wild Data for Effective Self-Supervised Pretraining in Speaker Recognition
    Shuai Wang , Qibing Bai , Qi Liu , Jianwei Yu , Zhengyang Chen , Bing Han , Yanmin Qian , and Haizhou Li
    CoRR, Oct 2023
  32. The second multi-channel multi-party meeting transcription challenge (M2MeT 2.0): A benchmark for speaker-attributed ASR
    Yuhao Liang , Mohan Shi , Fan Yu , Yangze Li , Shiliang Zhang , Zhihao Du , Qian Chen , Lei Xie , Yanmin Qian , Jian Wu , Zhuo Chen , Kong Aik Lee , Zhijie Yan , and Hui Bu
    CoRR, Oct 2023
  33. Diffusion Conditional Expectation Model for Efficient and Robust Target Speech Extraction
    Leying Zhang , Yao Qian , Linfeng Yu , Heming Wang , Xinkai Wang , Hemin Yang , Long Zhou , Shujie Liu , Yanmin Qian , and Michael Zeng
    CoRR, Oct 2023
  34. Toward Universal Speech Enhancement for Diverse Input Conditions
    Wangyou Zhang , Kohei Saijo , Zhong-Qiu Wang , Shinji Watanabe , and Yanmin Qian
    CoRR, Oct 2023
  35. One-Shot Sensitivity-Aware Mixed Sparsity Pruning for Large Language Models
    Hang Shao , Bei Liu , and Yanmin Qian
    CoRR, Oct 2023
  36. FAT-HuBERT: Front-end Adaptive Training of Hidden-unit BERT for Distortion-Invariant Robust Speech Recognition
    Dongning Yang , Wei Wang , and Yanmin Qian
    CoRR, Oct 2023
  37. Speaker Adaptive Text-to-Speech With Timbre-Normalized Vector-Quantized Feature
    Chenpeng Du , Yiwei Guo , Xie Chen, and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2023
  38. Fast-Hubert: an Efficient Training Framework for Self-Supervised Speech Representation Learning
    Guanrou Yang , Ziyang Ma , Zhisheng Zheng , Yakun Song , Zhikang Niu , and Xie Chen
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2023, Taipei, Taiwan, December 16-20, 2023 , Oct 2023
  39. Improving Few-Shot Learning for Talking Face System with TTS Data Augmentation
    Qi Chen , Ziyang Ma , Tao Liu , Xu Tan , Qu Lu , Kai Yu , and Xie Chen
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  40. Front-End Adapter: Adapting Front-End Input of Speech Based Self-Supervised Learning for Speech Recognition
    Xie Chen, Ziyang Ma , Changli Tang , Yujin Wang , and Zhisheng Zheng
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  41. Emodiff: Intensity Controllable Emotional Text-to-Speech with Soft-Label Guidance
    Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  42. DAE-Talker: High Fidelity Speech-Driven Talking Face Generation with Diffusion Autoencoder
    Chenpeng Du , Qi Chen , Tianyu He , Xu Tan , Xie Chen, Kai Yu, Sheng Zhao , and Jiang Bian
    In Proceedings of the 31st ACM International Conference on Multimedia, MM 2023, Ottawa, ON, Canada, 29 October 2023- 3 November 2023 , Oct 2023
  43. Blank-regularized CTC for Frame Skipping in Neural Transducer
    Yifan Yang , Xiaoyu Yang , Liyong Guo , Zengwei Yao , Wei Kang , Fangjun Kuang , Long Lin , Xie Chen, and Daniel Povey
    CoRR, Oct 2023
  44. UniCATS: A Unified Context-Aware Text-to-Speech Framework with Contextual VQ-Diffusion and Vocoding
    Chenpeng Du , Yiwei Guo , Feiyu Shen , Zhijun Liu , Zheng Liang , Xie Chen, Shuai Wang , Hui Zhang , and Kai Yu
    CoRR, Oct 2023
  45. Improving Code-Switching and Named Entity Recognition in ASR with Speech Editing based Data Augmentation
    Zheng Liang , Zheshu Song , Ziyang Ma , Chenpeng Du , Kai Yu , and Xie Chen
    CoRR, Oct 2023
  46. Pushing the Limits of Unsupervised Unit Discovery for SSL Speech Representation
    Ziyang Ma , Zhisheng Zheng , Guanrou Yang , Yu Wang , Chao Zhang , and Xie Chen
    CoRR, Oct 2023
  47. Towards Effective and Compact Contextual Representation for Conformer Transducer Speech Recognition Systems
    Mingyu Cui , Jiawen Kang , Jiajun Deng , Xi Yin , Yutao Xie , Xie Chen, and Xunying Liu
    CoRR, Oct 2023
  48. DSE-TTS: Dual Speaker Embedding for Cross-Lingual Text-to-Speech
    Sen Liu , Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
    CoRR, Oct 2023
  49. Unsupervised Active Learning: Optimizing Labeling Cost-Effectiveness for Automatic Speech Recognition
    Zhisheng Zheng , Ziyang Ma , Yu Wang , and Xie Chen
    CoRR, Oct 2023
  50. VoiceFlow: Efficient Text-to-Speech with Rectified Flow Matching
    Yiwei Guo , Chenpeng Du , Ziyang Ma , Xie Chen, and Kai Yu
    CoRR, Oct 2023
  51. Towards Universal Speech Discrete Tokens: A Case Study for ASR and TTS
    Yifan Yang , Feiyu Shen , Chenpeng Du , Ziyang Ma , Kai Yu, Daniel Povey , and Xie Chen
    CoRR, Oct 2023
  52. Incorporating Class-based Language Model for Named Entity Recognition in Factorized Neural Transducer
    Peng Wang , Yifan Yang , Zheng Liang , Tian Tan , Shiliang Zhang , and Xie Chen
    CoRR, Oct 2023
  53. Improved Factorized Neural Transducer Model For text-only Domain Adaptation
    Junzhe Liu , Jianwei Yu , and Xie Chen
    CoRR, Oct 2023
  54. Leveraging Speech PTM, Text LLM, and Emotional TTS for Speech Emotion Recognition
    Ziyang Ma , Wen Wu , Zhisheng Zheng , Yiwei Guo , Qian Chen , Shiliang Zhang , and Xie Chen
    CoRR, Oct 2023
  55. Acoustic BPE for Speech Generation with Discrete Tokens
    Feiyu Shen , Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
    CoRR, Oct 2023
  56. Expressive TTS Driven by Natural Language Prompts Using Few Human Annotations
    Hanglei Zhang , Yiwei Guo , Sen Liu , Xie Chen, and Kai Yu
    CoRR, Oct 2023
  57. emotion2vec: Self-Supervised Pre-Training for Speech Emotion Representation
    Ziyang Ma , Zhisheng Zheng , Jiaxin Ye , Jinchao Li , Zhifu Gao , Shiliang Zhang , and Xie Chen
    CoRR, Oct 2023
  58. OPAL: Ontology-Aware Pretrained Language Model for End-to-End Task-Oriented Dialogue
    Zhi Chen , Yuncong Liu , Lu Chen , Su Zhu , Mengyue Wu, and Kai Yu
    Trans. Assoc. Comput. Linguistics, Oct 2023
  59. Transcribing Vocal Communications of Domestic Shiba Inu Dogs
    Jieyi Huang , Chunhao Zhang , Mengyue Wu , and Kenny Q. Zhu
    In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  60. Detection of Multiple Mental Disorders from Social Media with Two-Stream Psychiatric Experts
    Siyuan Chen , Zhiling Zhang , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
  61. Semantic Space Grounded Weighted Decoding for Multi-Attribute Controllable Dialogue Generation
    Zhiling Zhang , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
  62. Diverse and Vivid Sound Generation from Text Descriptions
    Guangwei Li , Xuenan Xu , Lingfeng Dai , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  63. Investigating Pooling Strategies and Loss Functions for Weakly-Supervised Text-to-Audio Grounding via Contrastive Learning
    Xuenan Xu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  64. BLAT: Bootstrapping Language-Audio Pre-training based on AudioSet Tag-guided Synthetic Data
    Xuenan Xu , Zhiling Zhang , Zelin Zhou , Pingyue Zhang , Zeyu Xie , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the 31st ACM International Conference on Multimedia, MM 2023, Ottawa, ON, Canada, 29 October 2023- 3 November 2023 , Oct 2023
  65. LLM-empowered Chatbots for Psychiatrist and Patient Simulation: Application and Evaluation
    Siyuan Chen , Mengyue Wu , Kenny Q. Zhu , Kunyao Lan , Zhiling Zhang , and Lyuchun Cui
    CoRR, Oct 2023
  66. Enhance Temporal Relations in Audio Captioning with Sound Event Detection
    Zeyu Xie , Xuenan Xu , Mengyue Wu, and Kai Yu
    CoRR, Oct 2023
  67. Improving Audio Caption Fluency with Automatic Error Correction
    Hanxue Zhang , Zeyu Xie , Xuenan Xu , Mengyue Wu, and Kai Yu
    CoRR, Oct 2023
  68. A Large-scale Dataset for Audio-Language Representation Learning
    Luoyi Sun , Xuenan Xu , Mengyue Wu, and Weidi Xie
    CoRR, Oct 2023
  69. Does My Dog "Speak" Like Me? The Acoustic Correlation between Pet Dogs and Their Human Owners
    Jieyi Huang , Chunhao Zhang , Yufei Wang , Mengyue Wu , and Kenny Q. Zhu
    CoRR, Oct 2023
  70. Towards Lexical Analysis of Dog Vocalizations via Online Videos
    Yufei Wang , Chunhao Zhang , Jieyi Huang , Mengyue Wu , and Kenny Q. Zhu
    CoRR, Oct 2023
  71. PsyEval: A Comprehensive Large Language Model Evaluation Benchmark for Mental Health
    Haoan Jin , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
    CoRR, Oct 2023
  72. A Heterogeneous Graph to Abstract Syntax Tree Framework for Text-to-SQL
    Ruisheng Cao , Lu Chen, Jieyu Li , Hanchong Zhang , Hongshen Xu , Wangyou Zhang , and Kai Yu
    IEEE Trans. Pattern Anal. Mach. Intell., Oct 2023
  73. Speech Enhancement With Integration of Neural Homomorphic Synthesis and Spectral Masking
    Wenbin Jiang , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2023
  74. SPM: A Split-Parsing Method for Joint Multi-Intent Detection and Slot Filling
    Sheng Jiang , Su Zhu , Ruisheng Cao , Qingliang Miao , and Kai Yu
    In Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics: Industry Track, ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  75. Exploring Schema Generalizability of Text-to-SQL
    Jieyu Li , Lu Chen, Ruisheng Cao , Su Zhu , Hongshen Xu , Zhi Chen , Hanchong Zhang , and Kai Yu
    In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  76. TeCS: A Dataset and Benchmark for Tense Consistency of Machine Translation
    Yiming Ai , Zhiwei He , Kai Yu, and Rui Wang
    In Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  77. CSS: A Large-scale Cross-schema Chinese Text-to-SQL Medical Dataset
    Hanchong Zhang , Jieyu Li , Lu Chen, Ruisheng Cao , Yunyan Zhang , Yu Huang , Yefeng Zheng , and Kai Yu
    In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
  78. ACT-SQL: In-Context Learning for Text-to-SQL with Automatically-Generated Chain-of-Thought
    Hanchong Zhang , Ruisheng Cao , Lu Chen, Hongshen Xu , and Kai Yu
    In Findings of the Association for Computational Linguistics: EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
  79. Multi-Speaker Multi-Lingual VQTTS System for LIMMITS 2023 Challenge
    Chenpeng Du , Yiwei Guo , Feiyu Shen , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  80. DiffVoice: Text-to-Speech with Latent Diffusion
    Zhijun Liu , Yiwei Guo , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
  81. Large Language Models Are Semi-Parametric Reinforcement Learning Agents
    Danyang Zhang , Lu Chen, Situo Zhang , Hongshen Xu , Zihan Zhao , and Kai Yu
    In Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023 , Oct 2023
  82. Mobile-Env: A Universal Platform for Training and Evaluation of Mobile Interaction
    Danyang Zhang , Lu Chen, and Kai Yu
    CoRR, Oct 2023
  83. SciEval: A Multi-Level Large Language Model Evaluation Benchmark for Scientific Research
    Liangtai Sun , Yang Han , Zihan Zhao , Da Ma , Zhennan Shen , Baocai Chen , Lu Chen, and Kai Yu
    CoRR, Oct 2023
  84. ASTormer: An AST Structure-aware Transformer Decoder for Text-to-SQL
    Ruisheng Cao , Hanchong Zhang , Hongshen Xu , Jieyu Li , Da Ma , Lu Chen, and Kai Yu
    CoRR, Oct 2023
  85. DiffDub: Person-generic Visual Dubbing Using Inpainting Renderer with Diffusion Auto-encoder
    Tao Liu , Chenpeng Du , Shuai Fan , Feilong Chen , and Kai Yu
    CoRR, Oct 2023
  86. SEF-VC: Speaker Embedding Free Zero-Shot Voice Conversion with Cross Attention
    Junjie Li , Yiwei Guo , Xie Chen, and Kai Yu
    CoRR, Oct 2023

2022

  1. Heterogeneous Graph Representation for Knowledge Tracing
    Jisen Chen , Jian Shen , Ting Long , Liping Shen, Weinan Zhang , and Yong Yu
    In Neural Information Processing - 29th International Conference, ICONIP 2022, Virtual Event, November 22-26, 2022, Proceedings, Part I , Oct 2022
  2. A simple but practical method: How to improve the usage of entities in the Chinese question generation
    Haoze Yang , Kunyao Lan , Jiawei You , and Liping Shen
    In International Joint Conference on Neural Networks, IJCNN 2022, Padua, Italy, July 18-23, 2022 , Oct 2022
  3. From Uniform Models To Generic Representations: Stock Return Prediction With Pre-training
    Jiawei You , Tianyuan Han , and Liping Shen
    In International Joint Conference on Neural Networks, IJCNN 2022, Padua, Italy, July 18-23, 2022 , Oct 2022
  4. WavLM: Large-Scale Self-Supervised Pre-Training for Full Stack Speech Processing
    Sanyuan Chen , Chengyi Wang , Zhengyang Chen , Yu Wu , Shujie Liu , Zhuo Chen , Jinyu Li , Naoyuki Kanda , Takuya Yoshioka , Xiong Xiao , Jian Wu , Long Zhou , Shuo Ren , Yanmin Qian , Yao Qian , Jian Wu , Michael Zeng , Xiangzhan Yu , and Furu Wei
    IEEE J. Sel. Top. Signal Process., Oct 2022
  5. Optimizing Data Usage for Low-Resource Speech Recognition
    Yanmin Qian , and Zhikai Zhou
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  6. Dual-Path Modeling With Memory Embedding Model for Continuous Speech Separation
    Chenda Li , Zhuo Chen , and Yanmin Qian
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  7. Layer-Wise Fast Adaptation for End-to-End Multi-Accent Speech Recognition
    Yanmin Qian , Xun Gong , and Houjun Huang
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  8. End-to-End Dereverberation, Beamforming, and Speech Recognition in a Cocktail Party
    Wangyou Zhang , Xuankai Chang , Christoph Böddeker , Tomohiro Nakatani , Shinji Watanabe , and Yanmin Qian
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  9. Time-Domain Audio-Visual Speech Separation on Low Quality Videos
    Yifei Wu , Chenda Li , Jinfeng Bai , Zhongqin Wu , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  10. Skim: Skipping Memory LSTM for Low-Latency Real-Time Continuous Speech Separation
    Chenda Li , Lei Yang , Weiqin Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  11. Large-Scale Self-Supervised Speech Representation Learning for Automatic Speaker Verification
    Zhengyang Chen , Sanyuan Chen , Yu Wu , Yao Qian , Chengyi Wang , Shujie Liu , Yanmin Qian , and Michael Zeng
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  12. Local Information Modeling with Self-Attention for Speaker Verification
    Bing Han , Zhengyang Chen , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  13. Punctuation Prediction for Streaming On-Device Speech Recognition
    Zhikai Zhou , Tian Tan , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  14. MLP-SVNET: A Multi-Layer Perceptrons Based Network for Speaker Verification
    Bing Han , Zhengyang Chen , Bei Liu , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  15. Self-Knowledge Distillation via Feature Enhancement for Speaker Verification
    Bei Liu , Haoyu Wang , Zhengyang Chen , Shuai Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  16. Optimizing Alignment of Speech and Language Latent Spaces for End-To-End Speech Recognition and Understanding
    Wei Wang , Shuo Ren , Yao Qian , Shujie Liu , Yu Shi , Yanmin Qian , and Michael Zeng
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  17. Exploring Effective Data Utilization for Low-Resource Speech Recognition
    Zhikai Zhou , Wei Wang , Wangyou Zhang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  18. Summary on the ICASSP 2022 Multi-Channel Multi-Party Meeting Transcription Grand Challenge
    Fan Yu , Shiliang Zhang , Pengcheng Guo , Yihui Fu , Zhihao Du , Siqi Zheng , Weilong Huang , Lei Xie , Zheng-Hua Tan , DeLiang Wang , Yanmin Qian , Kong Aik Lee , Zhijie Yan , Bin Ma , Xin Xu , and Hui Bu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  19. The SJTU System For Multimodal Information Based Speech Processing Challenge 2021
    Wei Wang , Xun Gong , Yifei Wu , Zhikai Zhou , Chenda Li , Wangyou Zhang , Bing Han , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  20. Attentive Feature Fusion for Robust Speaker Verification
    Bei Liu , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  21. Dual Path Embedding Learning for Speaker Verification with Triplet Attention
    Bei Liu , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  22. DF-ResNet: Boosting Speaker Verification Performance with Depth-First Design
    Bei Liu , Zhengyang Chen , Shuai Wang , Haoyu Wang , Bing Han , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  23. Enroll-Aware Attentive Statistics Pooling for Target Speaker Verification
    Leying Zhang , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  24. MSDWild: Multi-modal Speaker Diarization Dataset in the Wild
    Tao Liu , Shuai Fan , Xu Xiang , Hongbo Song , Shaoxiong Lin , Jiaqi Sun , Tianyuan Han , Siyuan Chen , Binwei Yao , Sen Liu , Yifei Wu , Yanmin Qian , and Kai Yu
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  25. Knowledge Transfer and Distillation from Autoregressive to Non-Autoregressive Speech Recognition
    Xun Gong , Zhikai Zhou , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  26. Self-Supervised Speaker Verification Using Dynamic Loss-Gate and Label Correction
    Bing Han , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  27. Separating Long-Form Speech with Group-wise Permutation Invariant Training
    Wangyou Zhang , Zhuo Chen , Naoyuki Kanda , Shujie Liu , Jinyu Li , Sefik Emre Eskimez , Takuya Yoshioka , Xiong Xiao , Zhong Meng , Yanmin Qian , and Furu Wei
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  28. ESPnet-SE++: Speech Enhancement for Robust Speech Recognition, Translation, and Understanding
    Yen-Ju Lu , Xuankai Chang , Chenda Li , Wangyou Zhang , Samuele Cornell , Zhaoheng Ni , Yoshiki Masuyama , Brian Yan , Robin Scheibler , Zhong-Qiu Wang , Yu Tsao , Yanmin Qian , and Shinji Watanabe
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  29. Improving Speech Separation with Knowledge Distilled from Self-supervised Pre-trained Models
    Bowen Qu , Chenda Li , Jinfeng Bai , and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  30. Text-Informed Knowledge Distillation for Robust Speech Enhancement and Recognition
    Wei Wang , Wangyou Zhang , Shaoxiong Lin , and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  31. Medical Difficult Airway Detection using Speech Technology
    Zhikai Zhou , Shuang Cao , Zhengyang Chen , Bei Liu , Ming Xia , Hong Jiang , and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  32. Speaking style compensation on synthetic audio for robust keyword spotting
    Houjun Huang , and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  33. The Conversational Short-phrase Speaker Diarization (CSSD) Task: Dataset, Evaluation Metric and Baselines
    Gaofeng Cheng , Yifan Chen , Runyan Yang , Qingxuan Li , Zehui Yang , Lingxuan Ye , Pengyuan Zhang , Qingqing Zhang , Lei Xie , Yanmin Qian , Kong Aik Lee , and Yonghong Yan
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  34. The X-Lance Speaker Diarization System for the Conversational Short-phrase Speaker Diarization Challenge 2022
    Tao Liu , Xu Xiang , Zhengyang Chen , Bing Han , Kai Yu, and Yanmin Qian
    In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
  35. End-to-End Multi-Speaker ASR with Independent Vector Analysis
    Robin Scheibler , Wangyou Zhang , Xuankai Chang , Shinji Watanabe , and Yanmin Qian
    In IEEE Spoken Language Technology Workshop, SLT 2022, Doha, Qatar, January 9-12, 2023 , Oct 2022
  36. A Comprehensive Study on Self-Supervised Distillation for Speaker Representation Learning
    Zhengyang Chen , Yao Qian , Bing Han , Yanmin Qian , and Michael Zeng
    In IEEE Spoken Language Technology Workshop, SLT 2022, Doha, Qatar, January 9-12, 2023 , Oct 2022
  37. The SJTU X-LANCE Lab System for CNSRC 2022
    Zhengyang Chen , Bei Liu , Bing Han , Leying Zhang , and Yanmin Qian
    CoRR, Oct 2022
  38. SJTU-AISPEECH System for VoxCeleb Speaker Recognition Challenge 2022
    Zhengyang Chen , Bing Han , Xu Xiang , Houjun Huang , Bei Liu , and Yanmin Qian
    CoRR, Oct 2022
  39. Build a SRE Challenge System: Lessons from VoxSRC 2022 and CNSRC 2022
    Zhengyang Chen , Bing Han , Xu Xiang , Houjun Huang , Bei Liu , and Yanmin Qian
    CoRR, Oct 2022
  40. Factorized Neural Transducer for Efficient Language Model Adaptation
    Xie Chen, Zhong Meng , Sarangarajan Parthasarathy , and Jinyu Li
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  41. VQTTS: High-Fidelity Text-to-Speech Synthesis with Self-Supervised VQ Acoustic Feature
    Chenpeng Du , Yiwei Guo , Xie Chen, and Kai Yu
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  42. Internal Language Model Adaptation with Text-Only Data for End-to-End Speech Recognition
    Zhong Meng , Yashesh Gaur , Naoyuki Kanda , Jinyu Li , Xie Chen , Yu Wu , and Yifan Gong
    In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
  43. Exploring Effective Distillation of Self-Supervised Speech Models for Automatic Speech Recognition
    Yujin Wang , Changli Tang , Ziyang Ma , Zhisheng Zheng , Xie Chen, and Wei-Qiang Zhang
    CoRR, Oct 2022
  44. MT4SSL: Boosting Self-Supervised Speech Representation Learning by Integrating Multiple Targets
    Ziyang Ma , Zhisheng Zheng , Changli Tang , Yujin Wang , and Xie Chen
    CoRR, Oct 2022
  45. EmoDiff: Intensity Controllable Emotional Text-to-Speech with Soft-Label Guidance
    Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
    CoRR, Oct 2022
  46. Exploring Effective Fusion Algorithms for Speech Based Self-Supervised Learning Models
    Changli Tang , Yujin Wang , Xie Chen, and Wei-Qiang Zhang
    CoRR, Oct 2022
  47. D4: a Chinese Dialogue Dataset for Depression-Diagnosis-Oriented Chat
    Binwei Yao , Chao Shi , Likai Zou , Lingfeng Dai , Mengyue Wu, Lu Chen, Zhen Wang , and Kai Yu
    In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
  48. Symptom Identification for Interpretable Detection of Multiple Mental Disorders on Social Media
    Zhiling Zhang , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
  49. Category-Adapted Sound Event Enhancement with Weakly Labeled Data
    Guangwei Li , Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  50. Diversity-Controllable and Accurate Audio Captioning Based on Neural Condition
    Xuenan Xu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  51. Can Audio Captions Be Evaluated With Image Caption Metrics?
    Zelin Zhou , Zhiling Zhang , Xuenan Xu , Zeyu Xie , Mengyue Wu , and Kenny Q. Zhu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  52. Navigating Audio-Visual Event Detection Across Mismatched Modalities
    Guangwei Li , Xuenan Xu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  53. Audio-Text Retrieval in Context
    Siyu Lou , Xuenan Xu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  54. Climate and Weather: Inspecting Depression Detection via Emotion Recognition
    Wen Wu , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  55. Psychiatric Scale Guided Risky Post Screening for Early Detection of Depression
    Zhiling Zhang , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
    In Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence, IJCAI 2022, Vienna, Austria, 23-29 July 2022 , Oct 2022
  56. A Comprehensive Survey of Automated Audio Captioning
    Xuenan Xu , Mengyue Wu, and Kai Yu
    CoRR, Oct 2022
  57. DialogZoo: Large-Scale Dialog-Oriented Task Learning
    Zhi Chen , Jijia Bao , Lu Chen, Yuncong Liu , Da Ma , Bei Chen , Mengyue Wu , Su Zhu , Jian-Guang Lou , and Kai Yu
    CoRR, Oct 2022
  58. Data augmentation based non-parallel voice conversion with frame-level speaker disentangler
    Bo Chen , Zhihang Xu , and Kai Yu
    Speech Commun., Oct 2022
  59. Phone-Level Prosody Modelling With GMM-Based MDN for Diverse and Controllable Speech Synthesis
    Chenpeng Du , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  60. Neural Fusion for Voice Cloning
    Bo Chen , Chenpeng Du , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
  61. META-GUI: Towards Multi-modal Conversational Agents on Mobile GUI
    Liangtai Sun , Xingyu Chen , Lu Chen, Tianle Dai , Zichen Zhu, and Kai Yu
    In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
  62. AdapterShare: Task Correlation Modeling with Adapter Differentiation
    Zhi Chen , Bei Chen , Lu Chen, Kai Yu, and Jian-Guang Lou
    In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
  63. LatticeBART: Lattice-to-Lattice Pre-Training for Speech Recognition
    Lingfeng Dai , Lu Chen, Zhikai Zhou , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  64. Text Adaptive Detection for Customizable Keyword Spotting
    Yu Xi , Tian Tan , Wangyou Zhang , Baochen Yang , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  65. Unsupervised Word-Level Prosody Tagging for Controllable Speech Synthesis
    Yiwei Guo , Chenpeng Du , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
  66. The AISP-SJTU Simultaneous Translation System for IWSLT 2022
    Qinpei Zhu , Renshou Wu , Guangfeng Liu , Xinyu Zhu , Xingyu Chen , Yang Zhou , Qingliang Miao , Rui Wang , and Kai Yu
    In Proceedings of the 19th International Conference on Spoken Language Translation, IWSLT@ACL 2022, Dublin, Ireland (in-person and online), May 26-27, 2022 , Oct 2022
  67. TIE: Topological Information Enhanced Structural Reading Comprehension on Web Pages
    Zihan Zhao , Lu Chen, Ruisheng Cao , Hongshen Xu , Xingyu Chen , and Kai Yu
    In Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL 2022, Seattle, WA, United States, July 10-15, 2022 , Oct 2022
  68. UniDU: Towards A Unified Generative Dialogue Understanding Framework
    Zhi Chen , Lu Chen , Bei Chen , Libo Qin , Yuncong Liu , Su Zhu , Jian-Guang Lou , and Kai Yu
    In Proceedings of the 23rd Annual Meeting of the Special Interest Group on Discourse and Dialogue, SIGDIAL 2022, Edinburgh, UK, 07-09 September 2022 , Oct 2022
  69. The AISP-SJTU Translation System for WMT 2022
    Guangfeng Liu , Qinpei Zhu , Xingyu Chen , Renjie Feng , Jianxin Ren , Renshou Wu , Qingliang Miao , Rui Wang , and Kai Yu
    In Proceedings of the Seventh Conference on Machine Translation, WMT 2022, Abu Dhabi, United Arab Emirates (Hybrid), December 7-8, 2022 , Oct 2022

2021

  1. Modified Magnitude-Phase Spectrum Information for Spoofing Detection
    Jichen Yang , Hongji Wang , Rohan Kumar Das , and Yanmin Qian
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
  2. Audio-Visual Deep Neural Network for Robust Person Verification
    Yanmin Qian , Zhengyang Chen , and Shuai Wang
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
  3. Dual-Path Modeling for Long Recording Speech Separation in Meetings
    Chenda Li , Zhuo Chen , Yi Luo , Cong Han , Tianyan Zhou , Keisuke Kinoshita , Marc Delcroix , Shinji Watanabe , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  4. Self-Supervised Learning Based Domain Adaptation for Robust Speaker Verification
    Zhengyang Chen , Shuai Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  5. SynAug: Synthesis-Based Data Augmentation for Text-Dependent Speaker Verification
    Chenpeng Du , Bing Han , Shuai Wang , Yanmin Qian , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  6. Unit Selection Synthesis Based Data Augmentation for Fixed Phrase Speaker Verification
    Houjun Huang , Xu Xiang , Fei Zhao , Shuai Wang , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  7. AISpeech-SJTU Accent Identification System for the Accented English Speech Recognition Challenge
    Houjun Huang , Xu Xiang , Yexin Yang , Rao Ma , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  8. AISpeech-SJTU ASR System for the Accented English Speech Recognition Challenge
    Tian Tan , Yizhou Lu , Rao Ma , Sen Zhu , Jiaqi Guo , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  9. Towards Data Selection on TTS Data for Children’s Speech Recognition
    Wei Wang , Zhikai Zhou , Yizhou Lu , Hongji Wang , Chenpeng Du , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  10. End-to-End Dereverberation, Beamforming, and Speech Recognition with Improved Numerical Stability and Advanced Frontend
    Wangyou Zhang , Christoph Böddeker , Shinji Watanabe , Tomohiro Nakatani , Marc Delcroix , Keisuke Kinoshita , Tsubasa Ochiai , Naoyuki Kamo , Reinhold Haeb-Umbach , and Yanmin Qian
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  11. The Accented English Speech Recognition Challenge 2020: Open Datasets, Tracks, Baselines, Results and Methods
    Xian Shi , Fan Yu , Yizhou Lu , Yuhao Liang , Qiangze Feng , Daliang Wang , Yanmin Qian , and Lei Xie
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  12. Convolutive Transfer Function Invariant SDR Training Criteria for Multi-Channel Reverberant Speech Separation
    Christoph Böddeker , Wangyou Zhang , Tomohiro Nakatani , Keisuke Kinoshita , Tsubasa Ochiai , Marc Delcroix , Naoyuki Kamo , Yanmin Qian , and Reinhold Haeb-Umbach
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  13. Layer-Wise Fast Adaptation for End-to-End Multi-Accent Speech Recognition
    Xun Gong , Yizhou Lu , Zhikai Zhou , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  14. Knowledge Distillation from Multi-Modality to Single-Modality for Person Verification
    Leying Zhang , Zhengyang Chen , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  15. Basis-MelGAN: Efficient Neural Vocoder Based on Audio Decomposition
    Zhengxi Liu , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  16. The SJTU System for Short-Duration Speaker Verification Challenge 2021
    Bing Han , Zhengyang Chen , Zhikai Zhou , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  17. Audio-Visual Multi-Talker Speech Recognition in a Cocktail Party
    Yifei Wu , Chenda Li , Song Yang , Zhongqin Wu , and Yanmin Qian
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  18. Speaker Embedding Augmentation with Noise Distribution Matching
    Xun Gong , Zhengyang Chen , Yexin Yang , Shuai Wang , Lan Wang , and Yanmin Qian
    In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
  19. Revisiting the Statistics Pooling Layer in Deep Speaker Embedding Learning
    Shuai Wang , Yexin Yang , Yanmin Qian , and Kai Yu
    In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
  20. Data Augmentation for end-to-end Code-Switching Speech Recognition
    Chenpeng Du , Hao Li , Yizhou Lu , Lan Wang , and Yanmin Qian
    In IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021 , Oct 2021
  21. Dual-Path RNN for Long Recording Speech Separation
    Chenda Li , Yi Luo , Cong Han , Jinyu Li , Takuya Yoshioka , Tianyan Zhou , Marc Delcroix , Keisuke Kinoshita , Christoph Böddeker , Yanmin Qian , Shinji Watanabe , and Zhuo Chen
    In IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021 , Oct 2021
  22. Closing the Gap Between Time-Domain Multi-Channel Speech Enhancement on Real and Simulation Conditions
    Wangyou Zhang , Jing Shi , Chenda Li , Shinji Watanabe , and Yanmin Qian
    In IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2021, New Paltz, NY, USA, October 17-20, 2021 , Oct 2021
  23. Towards Duration Robust Weakly Supervised Sound Event Detection
    Heinrich Dinkel , Mengyue Wu, and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
  24. Voice Activity Detection in the Wild: A Data-Driven Approach Using Teacher-Student Training
    Heinrich Dinkel , Shuai Wang , Xuenan Xu , Mengyue Wu, and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
  25. Building Interpretable Interaction Trees for Deep NLP Models
    Die Zhang , Hao Zhang , Huilin Zhou , Xiaoyi Bao , Da Huo , Ruizhao Chen , Xu Cheng , Mengyue Wu, and Quanshi Zhang
    In Thirty-Fifth AAAI Conference on Artificial Intelligence, AAAI 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, IAAI 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, EAAI 2021, Virtual Event, February 2-9, 2021 , Oct 2021
  26. Decoupled Dialogue Modeling and Semantic Parsing for Multi-Turn Text-to-SQL
    Zhi Chen , Lu Chen, Hanqi Li , Ruisheng Cao , Da Ma , Mengyue Wu, and Kai Yu
    In Findings of the Association for Computational Linguistics: ACL/IJCNLP 2021, Online Event, August 1-6, 2021 , Oct 2021
  27. Enriching Ontology with Temporal Commonsense for Low-Resource Audio Tagging
    Zhiling Zhang , Zelin Zhou , Haifeng Tang , Guangwei Li , Mengyue Wu , and Kenny Q. Zhu
    In CIKM ’21: The 30th ACM International Conference on Information and Knowledge Management, Virtual Event, Queensland, Australia, November 1 - 5, 2021 , Oct 2021
  28. Text-to-Audio Grounding: Building Correspondence Between Captions and Sound Events
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  29. Investigating Local and Global Information for Automated Audio Captioning with Transfer Learning
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, Zeyu Xie , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
  30. A Lightweight Framework for Online Voice Activity Detection in the Wild
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  31. Audio Caption in a Car Setting with a Sentence-Level Loss
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
  32. DEPA: Self-Supervised Audio Embedding for Depression Detection
    Pingyue Zhang , Mengyue Wu, Heinrich Dinkel , and Kai Yu
    In MM ’21: ACM Multimedia Conference, Virtual Event, China, October 20 - 24, 2021 , Oct 2021
  33. LET: Linguistic Knowledge Enhanced Graph Transformer for Chinese Short Text Matching
    Boer Lyu , Lu Chen , Su Zhu , and Kai Yu
    In Thirty-Fifth AAAI Conference on Artificial Intelligence, AAAI 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, IAAI 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, EAAI 2021, Virtual Event, February 2-9, 2021 , Oct 2021
  34. LGESQL: Line Graph Enhanced Text-to-SQL Model with Mixed Local and Non-Local Relations
    Ruisheng Cao , Lu Chen , Zhi Chen , Yanbin Zhao , Su Zhu , and Kai Yu
    In Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing, ACL/IJCNLP 2021, (Volume 1: Long Papers), Virtual Event, August 1-6, 2021 , Oct 2021
  35. WebSRC: A Dataset for Web-Based Structural Reading Comprehension
    Xingyu Chen , Zihan Zhao , Lu Chen, Jiabao Ji , Danyang Zhang , Ao Luo , Yuxuan Xiong , and Kai Yu
    In Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, EMNLP 2021, Virtual Event / Punta Cana, Dominican Republic, 7-11 November, 2021 , Oct 2021
  36. Glyph Enhanced Chinese Character Pre-Training for Lexical Sememe Prediction
    Boer Lyu , Lu Chen, and Kai Yu
    In Findings of the Association for Computational Linguistics: EMNLP 2021, Virtual Event / Punta Cana, Dominican Republic, 16-20 November, 2021 , Oct 2021
  37. Class-Based Neural Network Language Model for Second-Pass Rescoring in ASR
    Lingfeng Dai , Qi Liu , and Kai Yu
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  38. Rich Prosody Diversity Modelling with Phone-Level Mixture Density Network
    Chenpeng Du , and Kai Yu
    In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
  39. ShadowGNN: Graph Projection Neural Network for Text-to-SQL Parser
    Zhi Chen , Lu Chen, Yanbin Zhao , Ruisheng Cao , Zihan Xu , Su Zhu , and Kai Yu
    In Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2021, Online, June 6-11, 2021 , Oct 2021
  40. Few-Shot NLU with Vector Projection Distance and Abstract Triangular CRF
    Su Zhu , Lu Chen, Ruisheng Cao , Zhi Chen , Qingliang Miao , and Kai Yu
    In Natural Language Processing and Chinese Computing - 10th CCF International Conference, NLPCC 2021, Qingdao, China, October 13-17, 2021, Proceedings, Part I , Oct 2021
  41. Relation-Aware Multi-hop Reasoning for Visual Dialog
    Yao Zhao , Lu Chen, and Kai Yu
    In Natural Language Processing and Chinese Computing - 10th CCF International Conference, NLPCC 2021, Qingdao, China, October 13-17, 2021, Proceedings, Part I , Oct 2021
  42. Mixture Density Network for Phone-Level Prosody Modelling in Speech Synthesis
    Chenpeng Du , and Kai Yu
    CoRR, Oct 2021
  43. Diverse and Controllable Speech Synthesis with GMM-Based Phone-Level Prosody Modelling
    Chenpeng Du , and Kai Yu
    CoRR, Oct 2021

2020

  1. Improving End-to-End Single-Channel Multi-Talker Speech Recognition
    Wangyou Zhang , Xuankai Chang , Yanmin Qian , and Shinji Watanabe
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  2. Data Augmentation Using Deep Generative Models for Embedding Based Speaker Recognition
    Shuai Wang , Yexin Yang , Zhanghao Wu , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  3. End-To-End Multi-Speaker Speech Recognition With Transformer
    Xuankai Chang , Wangyou Zhang , Yanmin Qian , Jonathan Le Roux , and Shinji Watanabe
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  4. Text Adaptation for Speaker Verification with Speaker-Text Factorized Embeddings
    Yexin Yang , Shuai Wang , Xun Gong , Yanmin Qian , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  5. Channel Invariant Speaker Embedding Learning with Joint Multi-Task and Adversarial Training
    Zhengyang Chen , Shuai Wang , Yanmin Qian , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  6. Deep Audio-Visual Speech Separation with Attention Mechanism
    Chenda Li , and Yanmin Qian
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  7. Learning Contextual Language Embeddings for Monaural Multi-Talker Speech Recognition
    Wangyou Zhang , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  8. End-to-End Far-Field Speech Recognition with Unified Dereverberation and Beamforming
    Wangyou Zhang , Aswin Shanmugam Subramanian , Xuankai Chang , Shinji Watanabe , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  9. Dual-Adversarial Domain Adaptation for Generalized Replay Attack Detection
    Hongji Wang , Heinrich Dinkel , Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  10. Listen, Watch and Understand at the Cocktail Party: Audio-Visual-Contextual Speech Separation
    Chenda Li , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  11. Multi-Modality Matters: A Performance Leap on VoxCeleb
    Zhengyang Chen , Shuai Wang , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  12. Adversarial Domain Adaptation for Speaker Verification Using Partially Shared Network
    Zhengyang Chen , Shuai Wang , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  13. Bi-Encoder Transformer Network for Mandarin-English Code-Switching Speech Recognition Using Mixture of Experts
    Yizhou Lu , Mingkun Huang , Hao Li , Jiaqi Guo , and Yanmin Qian
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  14. End-to-End Speaker-Dependent Voice Activity Detection
    Yefei Chen , Shuai Wang , Yanmin Qian , and Kai Yu
    CoRR, Oct 2020
  15. A CRNN-GRU Based Reinforcement Learning Approach to Audio Captioning
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In Proceedings of the 5th Workshop on Detection and Classification of Acoustic Scenes and Events 2020 (DCASE 2020), Tokyo, Japan (full virtual), November 2-4, 2020 , Oct 2020
  16. Multiple Sound Sources Localization from Coarse to Fine
    Rui Qian , Di Hu , Heinrich Dinkel , Mengyue Wu, Ning Xu , and Weiyao Lin
    In Computer Vision - ECCV 2020 - 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part XX , Oct 2020
  17. Voice Activity Detection in the Wild via Weakly Supervised Sound Event Detection
    Yefei Chen , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  18. GPVAD: Towards noise robust voice activity detection via weakly supervised sound event detection
    Heinrich Dinkel , Yefei Chen , Mengyue Wu, and Kai Yu
    CoRR, Oct 2020
  19. Interpreting Hierarchical Linguistic Interactions in DNNs
    Die Zhang , Huilin Zhou , Xiaoyi Bao , Da Huo , Ruizhao Chen , Xu Cheng , Hao Zhang , Mengyue Wu, and Quanshi Zhang
    CoRR, Oct 2020
  20. Towards a new generation of artificial intelligence in China
    Fei Wu , Cewu Lu , Mingjie Zhu , Hao Chen , Jun Zhu , Kai Yu, Lei Li , Ming Li , Qianfeng Chen , Xi Li , Xudong Cao , Zhongyuan Wang , Zhengjun Zha , Yueting Zhuang , and Yunhe Pan
    Nat. Mach. Intell., Oct 2020
  21. Prior Knowledge Driven Label Embedding for Slot Filling in Natural Language Understanding
    Su Zhu , Zijian Zhao , Rao Ma , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  22. Dual Learning for Semi-Supervised Natural Language Understanding
    Su Zhu , Ruisheng Cao , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  23. Modular End-to-End Automatic Speech Recognition Framework for Acoustic-to-Word Model
    Qi Liu , Zhehuai Chen , Hao Li , Mingkun Huang , Yizhou Lu , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  24. Distributed Structured Actor-Critic Reinforcement Learning for Universal Dialogue Management
    Zhi Chen , Lu Chen, Xiaoyuan Liu , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  25. Neural Network Language Model Compression With Product Quantization and Soft Binarization
    Kai Yu, Rao Ma , Kaiyu Shi , and Qi Liu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
  26. Schema-Guided Multi-Domain Dialogue State Tracking with Graph Attention Neural Networks
    Lu Chen, Boer Lv , Chi Wang , Su Zhu , Bowen Tan , and Kai Yu
    In The Thirty-Fourth AAAI Conference on Artificial Intelligence, AAAI 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, IAAI 2020, The Tenth AAAI Symposium on Educational Advances in Artificial Intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 , Oct 2020
  27. Semi-Supervised Text Simplification with Back-Translation and Asymmetric Denoising Autoencoders
    Yanbin Zhao , Lu Chen , Zhi Chen , and Kai Yu
    In The Thirty-Fourth AAAI Conference on Artificial Intelligence, AAAI 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, IAAI 2020, The Tenth AAAI Symposium on Educational Advances in Artificial Intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 , Oct 2020
  28. Line Graph Enhanced AMR-to-Text Generation with Mix-Order Graph Attention Networks
    Yanbin Zhao , Lu Chen , Zhi Chen , Ruisheng Cao , Su Zhu , and Kai Yu
    In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
  29. Neural Graph Matching Networks for Chinese Short Text Matching
    Lu Chen, Yanbin Zhao , Boer Lyu , Lesheng Jin , Zhi Chen , Su Zhu , and Kai Yu
    In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
  30. Unsupervised Dual Paraphrasing for Two-stage Semantic Parsing
    Ruisheng Cao , Su Zhu , Chenyu Yang , Chen Liu , Rao Ma , Yanbin Zhao , Lu Chen, and Kai Yu
    In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
  31. Efficient Context and Schema Fusion Networks for Multi-Domain Dialogue State Tracking
    Su Zhu , Jieyu Li , Lu Chen, and Kai Yu
    In Findings of the Association for Computational Linguistics: EMNLP 2020, Online Event, 16-20 November 2020 , Oct 2020
  32. Duration Robust Weakly Supervised Sound Event Detection
    Heinrich Dinkel , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  33. Investigation of Specaugment for Deep Speaker Embedding Learning
    Shuai Wang , Johan Rohdin , Oldřich Plchot , Lukáš Burget , Kai Yu, and Jan Černocký
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  34. Speaker Augmentation for Low Resource Speech Recognition
    Chenpeng Du , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  35. Neural Lattice Search for Speech Recognition
    Rao Ma , Hao Li , Qi Liu , Lu Chen, and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  36. A Hierarchical Tracker for Multi-Domain Dialogue State Tracking
    Jieyu Li , Su Zhu , and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  37. Addressing the Polysemy Problem in Language Modeling with Attentional Multi-Sense Embeddings
    Rao Ma , Lesheng Jin , Qi Liu , Lu Chen, and Kai Yu
    In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
  38. CODA: Improving Resource Utilization by Slimming and Co-locating DNN and CPU Jobs
    Han Zhao , Weihao Cui , Quan Chen , Jingwen Leng , Kai Yu, Deze Zeng , Chao Li , and Minyi Guo
    In 40th IEEE International Conference on Distributed Computing Systems, ICDCS 2020, Singapore, November 29 - December 1, 2020 , Oct 2020
  39. Jointly Encoding Word Confusion Network and Dialogue Context with BERT for Spoken Language Understanding
    Chen Liu , Su Zhu , Zijian Zhao , Ruisheng Cao , Lu Chen, and Kai Yu
    In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
  40. Memory Attention Neural Network for Multi-domain Dialogue State Tracking
    Zihan Xu , Zhi Chen , Lu Chen , Su Zhu , and Kai Yu
    In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
  41. Robust Spoken Language Understanding with RL-Based Value Error Recovery
    Chen Liu , Su Zhu , Lu Chen, and Kai Yu
    In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
  42. An Investigation on Different Underlying Quantization Schemes for Pre-trained Language Models
    Zihan Zhao , Yuncong Liu , Lu Chen, Qi Liu , Rao Ma , and Kai Yu
    In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
  43. An Investigation on Deep Learning with Beta Stabilizer
    Qi Liu , Tian Tan , and Kai Yu
    CoRR, Oct 2020
  44. Vector Projection Network for Few-shot Slot Tagging in Natural Language Understanding
    Su Zhu , Ruisheng Cao , Lu Chen, and Kai Yu
    CoRR, Oct 2020
  45. Deep Reinforcement Learning for On-line Dialogue State Tracking
    Zhi Chen , Lu Chen, Xiang Zhou , and Kai Yu
    CoRR, Oct 2020
  46. Structured Hierarchical Dialogue Policy with Graph Neural Networks
    Zhi Chen , Xiaoyuan Liu , Lu Chen, and Kai Yu
    CoRR, Oct 2020
  47. Dual Learning for Dialogue State Tracking
    Zhi Chen , Lu Chen, Yanbin Zhao , Su Zhu , and Kai Yu
    CoRR, Oct 2020
  48. CREDIT: Coarse-to-Fine Sequence Generation for Dialogue State Tracking
    Zhi Chen , Lu Chen, Zihan Xu , Yanbin Zhao , Su Zhu , and Kai Yu
    CoRR, Oct 2020

2019

  1. Erratum to: Past review, current progress, and challenges ahead on the cocktail party problem
    Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
    Frontiers Inf. Technol. Electron. Eng., Oct 2019
  2. Binary neural networks for speech recognition
    Yanmin Qian , and Xu Xiang
    Frontiers Inf. Technol. Electron. Eng., Oct 2019
  3. Data augmentation using generative adversarial networks for robust speech recognition
    Yanmin Qian , Hu Hu , and Tian Tan
    Speech Commun., Oct 2019
  4. Discriminative Neural Embedding Learning for Short-Duration Text-Independent Speaker Verification
    Shuai Wang , Zili Huang , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2019
  5. Margin Matters: Towards More Discriminative Deep Neural Network Embeddings for Speaker Recognition
    Xu Xiang , Shuai Wang , Houjun Huang , Yanmin Qian , and Kai Yu
    In 2019 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2019, Lanzhou, China, November 18-21, 2019 , Oct 2019
  6. GANs for Children: A Generative Data Augmentation Strategy for Children Speech Recognition
    Peiyao Sheng , Zhuolin Yang , and Yanmin Qian
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  7. MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition
    Xuankai Chang , Wangyou Zhang , Yanmin Qian , Jonathan Le Roux , and Shinji Watanabe
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  8. Exploring Model Units and Training Strategies for End-to-End Speech Recognition
    Mingkun Huang , Yizhou Lu , Lan Wang , Yanmin Qian , and Kai Yu
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  9. End-to-End Overlapped Speech Detection and Speaker Counting with Raw Waveform
    Wangyou Zhang , Man Sun , Lan Wang , and Yanmin Qian
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  10. Knowledge Distillation for Small Foot-print Deep Speaker Embedding
    Shuai Wang , Yexin Yang , Tianzhe Wang , Yanmin Qian , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
  11. End-to-end Monaural Multi-speaker ASR System without Pretraining
    Xuankai Chang , Yanmin Qian , Kai Yu, and Shinji Watanabe
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
  12. The SJTU Robust Anti-Spoofing System for the ASVspoof 2019 Challenge
    Yexin Yang , Hongji Wang , Heinrich Dinkel , Zhengyang Chen , Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  13. On the Usage of Phonetic Information for Text-Independent Speaker Embedding Extraction
    Shuai Wang , Johan Rohdin , Lukáš Burget , Oldřich Plchot , Yanmin Qian , Kai Yu, and Jan Černocký
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  14. Data Augmentation Using Variational Autoencoder for Embedding Based Speaker Verification
    Zhanghao Wu , Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  15. Joint Decoding of CTC Based Systems for Speech Recognition
    Jiaqi Guo , Yongbin You , Yanmin Qian , and Kai Yu
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  16. Knowledge Distillation for End-to-End Monaural Multi-Talker ASR System
    Wangyou Zhang , Xuankai Chang , and Yanmin Qian
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  17. Robust DOA Estimation Based on Convolutional Neural Network and Time-Frequency Masking
    Wangyou Zhang , Ying Zhou , and Yanmin Qian
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  18. Cross-Domain Replay Spoofing Attack Detection Using Domain Adversarial Training
    Hongji Wang , Heinrich Dinkel , Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  19. Prosody Usage Optimization for Children Speech Recognition with Zero Resource Children Speech
    Chenda Li , and Yanmin Qian
    In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
  20. Audio Caption: Listen and Tell
    Mengyue Wu, Heinrich Dinkel , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
  21. Text-based Depression Detection: What Triggers An Alert
    Heinrich Dinkel , Mengyue Wu, and Kai Yu
    CoRR, Oct 2019
  22. What does a Car-ssette tape tell?
    Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
    CoRR, Oct 2019
  23. AgentGraph: Toward Universal Dialogue Management With Structured Deep Reinforcement Learning
    Lu Chen , Zhi Chen , Bowen Tan , Sishan Long , Milica Gasic , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2019
  24. Semantic Parsing with Dual Learning
    Ruisheng Cao , Su Zhu , Chen Liu , Jieyu Li , and Kai Yu
    In Proceedings of the 57th Conference of the Association for Computational Linguistics, ACL 2019, Florence, Italy, July 28 - August 2, 2019, Volume 1: Long Papers , Oct 2019
  25. Highly Efficient Neural Network Language Model Compression Using Soft Binarization Training
    Rao Ma , Qi Liu , and Kai Yu
    In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
  26. Data Augmentation with Atomic Templates for Spoken Language Understanding
    Zijian Zhao , Su Zhu , and Kai Yu
    In Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing, EMNLP-IJCNLP 2019, Hong Kong, China, November 3-7, 2019 , Oct 2019
  27. A Hierarchical Decoding Model for Spoken Language Understanding from Unaligned Data
    Zijian Zhao , Su Zhu , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
  28. CATSLU: The 1st Chinese Audio-Textual Spoken Language Understanding Challenge
    Su Zhu , Zijian Zhao , Tiejun Zhao , Chengqing Zong , and Kai Yu
    In International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019 , Oct 2019
  29. Robust Spoken Language Understanding with Acoustic and Domain Knowledge
    Hao Li , Chen Liu , Su Zhu , and Kai Yu
    In International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019 , Oct 2019
  30. Cross Aggregation of Multi-head Attention for Neural Machine Translation
    Juncheng Cao , Hai Zhao , and Kai Yu
    In Natural Language Processing and Chinese Computing - 8th CCF International Conference, NLPCC 2019, Dunhuang, China, October 9-14, 2019, Proceedings, Part I , Oct 2019
  31. International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019
    Oct 2019

2018

  1. Past review, current progress, and challenges ahead on the cocktail party problem
    Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
    Frontiers Inf. Technol. Electron. Eng., Oct 2018
  2. Erratum to: Past review, current progress, and challenges ahead on the cocktail party problem
    Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
    Frontiers Inf. Technol. Electron. Eng., Oct 2018
  3. Sequence discriminative training for deep learning based acoustic keyword spotting
    Zhehuai Chen , Yanmin Qian , and Kai Yu
    Speech Commun., Oct 2018
  4. Single-channel multi-talker speech recognition with permutation invariant training
    Yanmin Qian , Xuankai Chang , and Dong Yu
    Speech Commun., Oct 2018
  5. Adaptive Very Deep Convolutional Residual Network for Noise Robust Speech Recognition
    Tian Tan , Yanmin Qian , Hu Hu , Ying Zhou , Wen Ding , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
  6. Investigating Raw Wave Deep Neural Networks for End-to-End Speaker Spoofing Detection
    Heinrich Dinkel , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
  7. Robust Mask Estimation By Integrating Neural Network-Based and Clustering-Based Approaches for Adaptive Acoustic Beamforming
    Ying Zhou , and Yanmin Qian
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  8. Knowledge Transfer in Permutation Invariant Training for Single-Channel Multi-Talker Speech Recognition
    Tian Tan , Yanmin Qian , and Dong Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  9. Joint I-Vector with End-to-End System for Short Duration Text-Independent Speaker Verification
    Zili Huang , Shuai Wang , and Yanmin Qian
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  10. Generative Adversarial Networks Based Data Augmentation for Noise Robust Speech Recognition
    Hu Hu , Tian Tan , and Yanmin Qian
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  11. Focal KL-Divergence Based Dilated Convolutional Neural Networks for Co-Channel Speaker Identification
    Shuai Wang , Yanmin Qian , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  12. Noise Robust Speech Recognition on Aurora4 by Humans and Machines
    Yanmin Qian , Tian Tan , Hu Hu , and Qi Liu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  13. Fast Adaptation on Deep Mixture Generative Network Based Acoustic Modeling
    Wen Ding , Tian Tan , and Yanmin Qian
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  14. Adaptive Permutation Invariant Training with Auxiliary Information for Monaural Multi-Talker Speech Recognition
    Xuankai Chang , Yanmin Qian , and Dong Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  15. Permutation Invariant Training of Generative Adversarial Network for Monaural Speech Separation
    Lianwu Chen , Meng Yu , Yanmin Qian , Dan Su , and Dong Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  16. Deep Extractor Network for Target Speaker Recovery from Single Channel Speech Mixtures
    Jun Wang , Jie Chen , Dan Su , Lianwu Chen , Meng Yu , Yanmin Qian , and Dong Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  17. Monaural Multi-Talker Speech Recognition with Attention Mechanism and Gated Convolutional Networks
    Xuankai Chang , Yanmin Qian , and Dong Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  18. Knowledge Distillation for Sequence Model
    Mingkun Huang , Yongbin You , Zhehuai Chen , Yanmin Qian , and Kai Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  19. Covariance Based Deep Feature for Text-Dependent Speaker Verification
    Shuai Wang , Heinrich Dinkel , Yanmin Qian , and Kai Yu
    In Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers , Oct 2018
  20. Data Augmentation using Conditional Generative Adversarial Networks for Robust Speech Recognition
    Peiyao Sheng , Zhuolin Yang , Hu Hu , Tian Tan , and Yanmin Qian
    In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
  21. Deep Discriminant Analysis for i-vector Based Robust Speaker Recognition
    Shuai Wang , Zili Huang , Yanmin Qian , and Kai Yu
    In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
  22. Generative Adversarial Networks based X-vector Augmentation for Robust Probabilistic Linear Discriminant Analysis in Speaker Verification
    Yexin Yang , Shuai Wang , Man Sun , Yanmin Qian , and Kai Yu
    In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
  23. Rich Short Text Conversation Using Semantic-Key-Controlled Sequence Generation
    Kai Yu, Zijian Zhao , Xueyang Wu , Hongtao Lin , and Xuan Liu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
  24. Structured Dialogue Policy with Graph Neural Networks
    Lu Chen, Bowen Tan , Sishan Long , and Kai Yu
    In Proceedings of the 27th International Conference on Computational Linguistics, COLING 2018, Santa Fe, New Mexico, USA, August 20-26, 2018 , Oct 2018
  25. Towards Universal Dialogue State Tracking
    Liliang Ren , Kaige Xie , Lu Chen, and Kai Yu
    In Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, Brussels, Belgium, October 31 - November 4, 2018 , Oct 2018
  26. On Modular Training of Neural Acoustics-to-Word Model for LVCSR
    Zhehuai Chen , Qi Liu , Hao Li , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  27. Semi-Supervised Training Using Adversarial Multi-Task Learning for Spoken Language Understanding
    Ouyu Lan , Su Zhu , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  28. Policy Adaptation for Deep Reinforcement Learning-Based Dialogue Management
    Lu Chen, Cheng Chang , Zhi Chen , Bowen Tan , Milica Gasic , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  29. Robust Spoken Language Understanding with Unsupervised ASR-Error Adaptation
    Su Zhu , Ouyu Lan , and Kai Yu
    In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
  30. MLN: Moment Localization Network and Samples Selection for Moment Retrieval
    Bo Huang , Ya Zhang , and Kai Yu
    In Proceedings of the 2nd International Conference on Video and Image Processing, ICVIP 2018, Hong Kong, China, December 29-31, 2018 , Oct 2018
  31. Angular Softmax for Short-Duration Text-independent Speaker Verification
    Zili Huang , Shuai Wang , and Kai Yu
    In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
  32. Joint Spoken Language Understanding and Domain Adaptive Language Modeling
    Huifeng Zhang , Su Zhu , Shuai Fan , and Kai Yu
    In Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers , Oct 2018
  33. Binarized LSTM Language Model
    Xuan Liu , Di Cao , and Kai Yu
    In Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2018, New Orleans, Louisiana, USA, June 1-6, 2018, Volume 1 (Long Papers) , Oct 2018
  34. Cost-Sensitive Active Learning for Dialogue State Tracking
    Kaige Xie , Cheng Chang , Liliang Ren , Lu Chen, and Kai Yu
    In Proceedings of the 19th Annual SIGdial Meeting on Discourse and Dialogue, Melbourne, Australia, July 12-14, 2018 , Oct 2018
  35. Concept Transfer Learning for Adaptive Language Understanding
    Su Zhu , and Kai Yu
    In Proceedings of the 19th Annual SIGdial Meeting on Discourse and Dialogue, Melbourne, Australia, July 12-14, 2018 , Oct 2018
  36. Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers
    Oct 2018

2017

  1. Phone Synchronous Speech Recognition With CTC Lattices
    Zhehuai Chen , Yimeng Zhuang , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2017
  2. Deep Feature Engineering for Noise Robust Spoofing Detection
    Yanmin Qian , Nanxin Chen , Heinrich Dinkel , and Zhizheng Wu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2017
  3. Integrating online i-vector into GMM-UBM for text-dependent speaker verification
    Xiaowei Jiang , Shuai Wang , Xu Xiang , and Yanmin Qian
    In 2017 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2017, Kuala Lumpur, Malaysia, December 12-15, 2017 , Oct 2017
  4. Future vector enhanced LSTM language model for LVCSR
    Qi Liu , Yanmin Qian , and Kai Yu
    In 2017 IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2017, Okinawa, Japan, December 16-20, 2017 , Oct 2017
  5. Multi-view LSTM Language Model with Word-Synchronized Auxiliary Feature for LVCSR
    Yue Wu , Tianxing He , Zhehuai Chen , Yanmin Qian , and Kai Yu
    In Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data - 16th China National Conference, CCL 2017, - and - 5th International Symposium, NLP-NABD 2017, Nanjing, China, October 13-15, 2017, Proceedings , Oct 2017
  6. End-to-end spoofing detection with raw waveform CLDNNs
    Heinrich Dinkel , Nanxin Chen , Yanmin Qian , and Kai Yu
    In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
  7. Small-footprint convolutional neural network for spoofing detection
    Heinrich Dinkel , Yanmin Qian , and Kai Yu
    In 2017 International Joint Conference on Neural Networks, IJCNN 2017, Anchorage, AK, USA, May 14-19, 2017 , Oct 2017
  8. Binary Deep Neural Networks for Speech Recognition
    Xu Xiang , Yanmin Qian , and Kai Yu
    In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
  9. What Does the Speaker Embedding Encode?
    Shuai Wang , Yanmin Qian , and Kai Yu
    In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
  10. Recognizing Multi-Talker Speech with Permutation Invariant Training
    Dong Yu , Xuankai Chang , and Yanmin Qian
    In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
  11. A Unified Confidence Measure Framework Using Auxiliary Normalization Graph
    Zhehuai Chen , Yanmin Qian , and Kai Yu
    In Intelligence Science and Big Data Engineering - 7th International Conference, IScIDE 2017, Dalian, China, September 22-23, 2017, Proceedings , Oct 2017
  12. Adaptation of Deep Neural Network Acoustic Models for Robust Automatic Speech Recognition
    Khe Chai Sim , Yanmin Qian , Gautam Mantena , Lahiru Samarakoon , Souvik Kundu , and Tian Tan
    In New Era for Robust Speech Recognition, Exploiting Deep Learning , Oct 2017
  13. On-line Dialogue Policy Learning with Companion Teaching
    Lu Chen, Runzhe Yang , Cheng Chang , Zihao Ye , Xiang Zhou , and Kai Yu
    In Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics, EACL 2017, Valencia, Spain, April 3-7, 2017, Volume 2: Short Papers , Oct 2017
  14. Affordable On-line Dialogue Policy Learning
    Cheng Chang , Runzhe Yang , Lu Chen, Xiang Zhou , and Kai Yu
    In Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, EMNLP 2017, Copenhagen, Denmark, September 9-11, 2017 , Oct 2017
  15. Agent-Aware Dropout DQN for Safe and Efficient On-line Dialogue Policy Learning
    Lu Chen, Xiang Zhou , Cheng Chang , Runzhe Yang , and Kai Yu
    In Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, EMNLP 2017, Copenhagen, Denmark, September 9-11, 2017 , Oct 2017
  16. Confidence measures for CTC-based phone synchronous decoding
    Zhehuai Chen , Yimeng Zhuang , and Kai Yu
    In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
  17. Encoder-decoder with focus-mechanism for sequence labelling based spoken language understanding
    Su Zhu , and Kai Yu
    In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
  18. Discrete Duration Model for Speech Synthesis
    Bo Chen , Tianling Bian , and Kai Yu
    In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
  19. Deep Attentive Structured Language Model Based on LSTM
    Di Cao , and Kai Yu
    In Intelligence Science and Big Data Engineering - 7th International Conference, IScIDE 2017, Dalian, China, September 22-23, 2017, Proceedings , Oct 2017
  20. splab at the NTCIR-13 STC-2 Task
    Xuan Liu , Xueyang Wu , Ruinian Chen , Zijian Zhao , Hongtao Lin , and Kai Yu
    In The 13th NTCIR Conference, Evaluation of Information Access Technologies, National Center of Sciences, Tokyo, Japan, December 5-8, 2017 , Oct 2017

2016

  1. Deep features for automatic spoofing detection
    Yanmin Qian , Nanxin Chen , and Kai Yu
    Speech Commun., Oct 2016
  2. Cluster Adaptive Training for Deep Neural Network Based Acoustic Model
    Tian Tan , Yanmin Qian , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
  3. Neural Network Based Multi-Factor Aware Joint Training for Robust Speech Recognition
    Yanmin Qian , Tian Tan , and Dong Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
  4. Very Deep Convolutional Neural Networks for Noise Robust Speech Recognition
    Yanmin Qian , Mengxiao Bi , Tian Tan , and Kai Yu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
  5. Overview of BTAS 2016 speaker anti-spoofing competition
    Pavel Korshunov , Sébastien Marcel , Hannah Muckenhirn , André R. Gonçalves , A. G. Souza Mello , Ricardo Paranhos Velloso Violato , Flávio Olmos Simões , M. U. Neto , Marcus Assis Angeloni , José Augusto Stuchi , Heinrich Dinkel , Nanxin Chen , Yanmin Qian , Dipjyoti Paul , Goutam Saha , and Md. Sahidullah
    In 8th IEEE International Conference on Biometrics Theory, Applications and Systems, BTAS 2016, Niagara Falls, NY, USA, September 6-9, 2016 , Oct 2016
  6. Joint acoustic factor learning for robust deep neural network based automatic speech recognition
    Souvik Kundu , Gautam Mantena , Yanmin Qian , Tian Tan , Marc Delcroix , and Khe Chai Sim
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  7. Speaker-aware training of LSTM-RNNs for acoustic modelling
    Tian Tan , Yanmin Qian , Dong Yu , Souvik Kundu , Liang Lu , Khe Chai Sim , Xiong Xiao , and Yu Zhang
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  8. Improved DNN-based segmentation for multi-genre broadcast audio
    Linlin Wang , Chao Zhang , Philip C. Woodland , Mark J. F. Gales , Panagiota Karanasou , Pierre Lanchantin , Xunying Liu , and Yanmin Qian
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  9. An investigation into using parallel data for far-field speech recognition
    Yanmin Qian , Tian Tan , and Dong Yu
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  10. Integrated adaptation with multi-factor joint-learning for far-field speech recognition
    Yanmin Qian , Tian Tan , Dong Yu , and Yu Zhang
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  11. Unrestricted Vocabulary Keyword Spotting Using LSTM-CTC
    Yimeng Zhuang , Xuankai Chang , Yanmin Qian , and Kai Yu
    In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
  12. Multi-task joint-learning for robust voice activity detection
    Yimeng Zhuang , Sibo Tong , Maofan Yin , Yanmin Qian , and Kai Yu
    In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
  13. Very deep convolutional neural networks for robust speech recognition
    Yanmin Qian , and Philip C. Woodland
    In 2016 IEEE Spoken Language Technology Workshop, SLT 2016, San Diego, CA, USA, December 13-16, 2016 , Oct 2016
  14. Evolvable dialogue state tracking for statistical dialogue management
    Kai Yu, Lu Chen, Kai Sun , Qizhe Xie , and Su Zhu
    Frontiers Comput. Sci., Oct 2016
  15. Discriminatively trained joint speaker and environment representations for adaptation of deep neural network acoustic models
    Maofan Yin , Sunil Sivadas , Kai Yu, and Bin Ma
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  16. A comparative study of robustness of deep learning approaches for VAD
    Sibo Tong , Hao Gu , and Kai Yu
    In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
  17. Phone Synchronous Decoding with CTC Lattice
    Zhehuai Chen , Wei Deng , Tao Xu , and Kai Yu
    In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
  18. Hybrid Dialogue State Tracking for Real World Human-to-Human Dialogues
    Kai Sun , Su Zhu , Lu Chen, Siqiu Yao , Xueyang Wu , and Kai Yu
    In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
  19. On training bi-directional neural network language model with noise contrastive estimation
    Tianxing He , Yu Zhang , Jasha Droppo , and Kai Yu
    In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
  20. Rich punctuations prediction using large-scale deep learning
    Xueyang Wu , Su Zhu , Yue Wu , and Kai Yu
    In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
  21. Directed automatic speech transcription error correction using bidirectional LSTM
    Da Zheng , Zhehuai Chen , Yue Wu , and Kai Yu
    In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
  22. The splab at the NTCIR-12 Short Text Conversation Task
    Ke Wu , Xuan Liu , and Kai Yu
    In Proceedings of the 12th NTCIR Conference on Evaluation of Information Access Technologies, National Center of Sciences, Tokyo, Japan, June 7-10, 2016 , Oct 2016

2015

  1. Deep feature for text-dependent speaker verification
    Yuan Liu , Yanmin Qian , Nanxin Chen , Tianfan Fu , Ya Zhang , and Kai Yu
    Speech Commun., Oct 2015
  2. Multi-task joint-learning of deep neural networks for robust speech recognition
    Yanmin Qian , Maofan Yin , Yongbin You , and Kai Yu
    In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
  3. Cambridge University transcription systems for the multi-genre broadcast challenge
    Philip C. Woodland , Xunying Liu , Yanmin Qian , Chao Zhang , Mark J. F. Gales , Penny Karanasou , Pierre Lanchantin , and Linlin Wang
    In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
  4. The development of the Cambridge University alignment systems for the multi-genre broadcast challenge
    Pierre Lanchantin , Mark J. F. Gales , Penny Karanasou , Xunying Liu , Yanmin Qian , Linlin Wang , Philip C. Woodland , and Chao Zhang
    In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
  5. Speaker diarisation and longitudinal linking in multi-genre broadcast data
    Penny Karanasou , Mark J. F. Gales , Pierre Lanchantin , Xunying Liu , Yanmin Qian , Linlin Wang , Philip C. Woodland , and Chao Zhang
    In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
  6. Local trajectory based speech enhancement for robust speech recognition with deep neural network
    Yongbin You , Yanmin Qian , and Kai Yu
    In IEEE China Summit and International Conference on Signal and Information Processing, ChinaSIP 2015, Chengdu, China, July 12-15, 2015 , Oct 2015
  7. An investigation on DNN-derived bottleneck features for GMM-HMM based robust speech recognition
    Yongbin You , Yanmin Qian , Tianxing He , and Kai Yu
    In IEEE China Summit and International Conference on Signal and Information Processing, ChinaSIP 2015, Chengdu, China, July 12-15, 2015 , Oct 2015
  8. Cluster adaptive training for deep neural network
    Tian Tan , Yanmin Qian , Maofan Yin , Yimeng Zhuang , and Kai Yu
    In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
  9. A novel static parameter calculation method for model compensation
    Suliang Bu , Yunxin Zhao , Yanmin Qian , and Kai Yu
    In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
  10. Recurrent neural network language model with structured word embeddings for speech recognition
    Tianxing He , Xu Xiang , Yanmin Qian , and Kai Yu
    In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
  11. Automatic model redundancy reduction for fast back-propagation for deep neural networks in speech recognition
    Yanmin Qian , Tianxing He , Wei Deng , and Kai Yu
    In 2015 International Joint Conference on Neural Networks, IJCNN 2015, Killarney, Ireland, July 12-17, 2015 , Oct 2015
  12. Multi-task learning for text-dependent speaker verification
    Nanxin Chen , Yanmin Qian , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  13. Robust deep feature for spoofing detection - the SJTU system for ASVspoof 2015 challenge
    Nanxin Chen , Yanmin Qian , Heinrich Dinkel , Bo Chen , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  14. Very deep convolutional neural networks for LVCSR
    Mengxiao Bi , Yanmin Qian , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  15. Paragraph vector based topic model for language model adaptation
    Wengong Jin , Tianxing He , Yanmin Qian , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  16. Constrained Markov Bayesian Polynomial for Efficient Dialogue State Tracking
    Kai Yu, Kai Sun , Lu Chen , and Su Zhu
    IEEE ACM Trans. Audio Speech Lang. Process., Oct 2015
  17. An investigation of context clustering for statistical speech synthesis with deep neural network
    Bo Chen , Zhehuai Chen , Jiachen Xu , and Kai Yu
    In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
  18. Recurrent Polynomial Network for Dialogue State Tracking with Mismatched Semantic Parsers
    Qizhe Xie , Kai Sun , Su Zhu , Lu Chen, and Kai Yu
    In Proceedings of the SIGDIAL 2015 Conference, The 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 2-4 September 2015, Prague, Czech Republic , Oct 2015
  19. Hyper-parameter Optimisation of Gaussian Process Reinforcement Learning for Statistical Dialogue Management
    Lu Chen, Pei-Hao Su , and Milica Gasic
    In Proceedings of the SIGDIAL 2015 Conference, The 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 2-4 September 2015, Prague, Czech Republic , Oct 2015

2014

  1. Stochastic data sweeping for fast DNN training
    Wei Deng , Yanmin Qian , Yuchen Fan , Tianfan Fu , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
  2. Reshaping deep neural network for fast decoding by node-pruning
    Tianxing He , Yuchen Fan , Yanmin Qian , Tian Tan , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
  3. Second order vector Taylor series based robust speech recognition
    Suliang Bu , Yanmin Qian , Khe Chai Sim , Yongbin You , and Kai Yu
    In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
  4. Speaker verification with deep features
    Yuan Liu , Tianfan Fu , Yuchen Fan , Yanmin Qian , and Kai Yu
    In 2014 International Joint Conference on Neural Networks, IJCNN 2014, Beijing, China, July 6-11, 2014 , Oct 2014
  5. Tandem deep features for text-dependent speaker verification
    Tianfan Fu , Yanmin Qian , Yuan Liu , and Kai Yu
    In INTERSPEECH 2014, 15th Annual Conference of the International Speech Communication Association, Singapore, September 14-18, 2014 , Oct 2014
  6. A novel dynamic parameters calculation approach for model compensation
    Suliang Bu , Yanmin Qian , and Kai Yu
    In INTERSPEECH 2014, 15th Annual Conference of the International Speech Communication Association, Singapore, September 14-18, 2014 , Oct 2014
  7. Acoustic emotion recognition using deep neural network
    Jianwei Niu , Yanmin Qian , and Kai Yu
    In The 9th International Symposium on Chinese Spoken Language Processing, Singapore, September 12-14, 2014 , Oct 2014
  8. The SJTU System for Dialog State Tracking Challenge 2
    Kai Sun , Lu Chen , Su Zhu , and Kai Yu
    In Proceedings of the SIGDIAL 2014 Conference, The 15th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 18-20 June 2014, Philadelphia, PA, USA , Oct 2014
  9. A generalized rule based tracker for dialogue state tracking
    Kai Sun , Lu Chen , Su Zhu , and Kai Yu
    In 2014 IEEE Spoken Language Technology Workshop, SLT 2014, South Lake Tahoe, NV, USA, December 7-10, 2014 , Oct 2014
  10. Semantic parser enhancement for dialogue domain extension with little data
    Su Zhu , Lu Chen, Kai Sun , Da Zheng , and Kai Yu
    In 2014 IEEE Spoken Language Technology Workshop, SLT 2014, South Lake Tahoe, NV, USA, December 7-10, 2014 , Oct 2014

2013

  1. Combination of data borrowing strategies for low-resource LVCSR
    Yanmin Qian , Kai Yu, and Jia Liu
    In 2013 IEEE Workshop on Automatic Speech Recognition and Understanding, Olomouc, Czech Republic, December 8-12, 2013 , Oct 2013
  2. MLP-HMM two-stage unsupervised training for low-resource languages on conversational telephone speech recognition
    Yanmin Qian and Jia Liu
    In INTERSPEECH 2013, 14th Annual Conference of the International Speech Communication Association, Lyon, France, August 25-29, 2013 , Oct 2013
  3. A New Word Language Model Evaluation Metric for Character Based Languages
    Peilu Wang , Ruihua Sun , Hai Zhao , and Kai Yu
    In Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data - 12th China National Conference, CCL 2013 and First International Symposium, NLP-NABD 2013, Suzhou, China, October 10-12, 2013. Proceedings , Oct 2013

2012

  1. Introduction to the Issue on Advances in Spoken Dialogue Systems and Mobile Interface
    Jason D. Williams , Kai Yu, Brahim Chaib-draa , Oliver Lemon , Roberto Pieraccini , Olivier Pietquin , Pascal Poupart , and Steve J. Young
    IEEE J. Sel. Top. Signal Process., Oct 2012
  2. ICMI’12 grand challenge: haptic voice recognition
    Khe Chai Sim , Shengdong Zhao , Kai Yu, and Hank Liao
    In International Conference on Multimodal Interaction, ICMI ’12, Santa Monica, CA, USA, October 22-26, 2012 , Oct 2012
  3. Development of the 2012 SJTU HVR system
    Hainan Xu , Yuchen Fan , and Kai Yu
    In International Conference on Multimodal Interaction, ICMI ’12, Santa Monica, CA, USA, October 22-26, 2012 , Oct 2012
\ No newline at end of file diff --git a/projects/1_project/index.html b/projects/1_project/index.html index 3f2117861b3c..d2c33ba23d70 100644 --- a/projects/1_project/index.html +++ b/projects/1_project/index.html @@ -1,4 +1,4 @@ - project 1 | X - LANCE

project 1

a project with a background image

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
+        project 1 | X - LANCE                  

project 1

a project with a background image

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
 layout: page
 title: project
 description: a project with a background image
diff --git a/projects/2_project/index.html b/projects/2_project/index.html
index 3172b13dc3cf..3fd37dfebcce 100644
--- a/projects/2_project/index.html
+++ b/projects/2_project/index.html
@@ -1,4 +1,4 @@
-        project 2 | X - LANCE                  

project 2

a project with a background image and giscus comments

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
+        project 2 | X - LANCE                  

project 2

a project with a background image and giscus comments

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
 layout: page
 title: project
 description: a project with a background image
diff --git a/projects/3_project/index.html b/projects/3_project/index.html
index 4ad32db9bc79..086f363fefa1 100644
--- a/projects/3_project/index.html
+++ b/projects/3_project/index.html
@@ -1,4 +1,4 @@
-         project 3 | X - LANCE                  

project 3

a project that redirects to another website

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
+         project 3 | X - LANCE                  

project 3

a project that redirects to another website

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
 layout: page
 title: project
 description: a project with a background image
diff --git a/projects/4_project/index.html b/projects/4_project/index.html
index 8d701e6be009..9798d885b9c6 100644
--- a/projects/4_project/index.html
+++ b/projects/4_project/index.html
@@ -1,4 +1,4 @@
-        project 4 | X - LANCE                  

project 4

another without an image

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
+        project 4 | X - LANCE                  

project 4

another without an image

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
 layout: page
 title: project
 description: a project with a background image
diff --git a/projects/5_project/index.html b/projects/5_project/index.html
index a8c81474da39..8fd8e55c0642 100644
--- a/projects/5_project/index.html
+++ b/projects/5_project/index.html
@@ -1,4 +1,4 @@
-        project 5 | X - LANCE                  

project 5

a project with a background image

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
+        project 5 | X - LANCE                  

project 5

a project with a background image

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
 layout: page
 title: project
 description: a project with a background image
diff --git a/projects/6_project/index.html b/projects/6_project/index.html
index d21b78a10f8c..8d14d8a4f736 100644
--- a/projects/6_project/index.html
+++ b/projects/6_project/index.html
@@ -1,4 +1,4 @@
-        project 6 | X - LANCE                  

project 6

a project with no image

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
+        project 6 | X - LANCE                  

project 6

a project with no image

Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

To give your project a background in the portfolio page, just add the img tag to the front matter like so:

---
 layout: page
 title: project
 description: a project with a background image
diff --git a/projects/index.html b/projects/index.html
index 3be447d73a65..e2cdae12a39d 100644
--- a/projects/index.html
+++ b/projects/index.html
@@ -1 +1 @@
-        Projects | X - LANCE                  
© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file + Projects | X - LANCE
© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file diff --git a/repositories/index.html b/repositories/index.html index 9cfaed3cfd96..b59c7721ebcf 100644 --- a/repositories/index.html +++ b/repositories/index.html @@ -1 +1 @@ - Repos | X - LANCE

Repos

GitHub repositories (selected) of X-LANCE

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file + Repos | X - LANCE

Repos

GitHub repositories (selected) of X-LANCE

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file diff --git a/sitemap.xml b/sitemap.xml index 14fb44e23bd0..fbdbc87102d0 100644 --- a/sitemap.xml +++ b/sitemap.xml @@ -1 +1 @@ - https://x-lance.github.io/news/announcement_1/ 2023-12-31T00:00:00+00:00 https://x-lance.github.io/news/announcement_2/ 2023-12-31T00:00:00+00:00 https://x-lance.github.io/news/announcement_5/ 2024-01-24T00:00:00+00:00 https://x-lance.github.io/news/announcement_3/ 2024-02-29T00:00:00+00:00 https://x-lance.github.io/news/announcement_4/ 2024-03-14T00:00:00+00:00 https://x-lance.github.io/news/announcement_6/ 2024-04-07T00:00:00+00:00 https://x-lance.github.io/news/announcement_7/ 2024-05-02T00:00:00+00:00 https://x-lance.github.io/news/announcement_8/ 2024-05-16T00:00:00+00:00 https://x-lance.github.io/news/announcement_9/ 2024-05-18T00:00:00+00:00 https://x-lance.github.io/blog/2015/formatting-and-links/ 2015-03-15T16:40:16+00:00 https://x-lance.github.io/blog/2015/images/ 2015-05-15T21:01:00+00:00 https://x-lance.github.io/blog/2015/code/ 2015-07-15T15:09:00+00:00 https://x-lance.github.io/blog/2015/math/ 2015-10-20T15:12:00+00:00 https://x-lance.github.io/blog/2015/disqus-comments/ 2015-10-20T15:59:00+00:00 https://x-lance.github.io/blog/2018/distill/ 2018-12-22T00:00:00+00:00 https://x-lance.github.io/blog/2020/twitter/ 2020-09-28T15:12:00+00:00 https://x-lance.github.io/blog/2020/github-metadata/ 2020-09-28T21:01:00+00:00 https://x-lance.github.io/blog/2021/diagrams/ 2021-07-04T17:39:00+00:00 https://x-lance.github.io/blog/2022/redirect/ 2022-02-01T17:39:00+00:00 https://x-lance.github.io/blog/2022/giscus-comments/ 2022-12-10T15:59:00+00:00 https://x-lance.github.io/blog/2023/table-of-contents/ 2023-03-20T15:59:00+00:00 https://x-lance.github.io/blog/2023/tables/ 2023-03-20T18:37:00+00:00 https://x-lance.github.io/blog/2023/videos/ 2023-04-24T21:01:00+00:00 https://x-lance.github.io/blog/2023/audios/ 2023-04-25T10:25:00+00:00 https://x-lance.github.io/blog/2023/sidebar-table-of-contents/ 
2023-04-25T14:14:00+00:00 https://x-lance.github.io/blog/2023/custom-blockquotes/ 2023-05-12T19:53:00+00:00 https://x-lance.github.io/blog/2023/jupyter-notebook/ 2023-07-04T12:57:00+00:00 https://x-lance.github.io/blog/2023/post-bibliography/ 2023-07-12T13:56:00+00:00 https://x-lance.github.io/blog/2023/tikzjax/ 2023-12-12T22:25:00+00:00 https://x-lance.github.io/blog/2024/chartjs/ 2024-01-26T01:04:00+00:00 https://x-lance.github.io/blog/2024/echarts/ 2024-01-26T16:03:00+00:00 https://x-lance.github.io/blog/2024/geojson-map/ 2024-01-26T17:57:00+00:00 https://x-lance.github.io/blog/2024/vega-lite/ 2024-01-27T00:20:00+00:00 https://x-lance.github.io/blog/2024/advanced-images/ 2024-01-27T11:46:00+00:00 https://x-lance.github.io/blog/2024/code-diff/ 2024-01-27T19:22:00+00:00 https://x-lance.github.io/blog/2022/displaying-external-posts-on-your-al-folio-blog/ 2022-04-23T23:20:09+00:00 https://x-lance.github.io/projects/1_project/ 2024-05-26T02:44:10+00:00 https://x-lance.github.io/projects/2_project/ 2024-05-26T02:44:10+00:00 https://x-lance.github.io/projects/3_project/ 2024-05-26T02:44:10+00:00 https://x-lance.github.io/projects/4_project/ 2024-05-26T02:44:10+00:00 https://x-lance.github.io/projects/5_project/ 2024-05-26T02:44:10+00:00 https://x-lance.github.io/projects/6_project/ 2024-05-26T02:44:10+00:00 https://x-lance.github.io/ https://x-lance.github.io/members/alumni/ https://x-lance.github.io/cv/ https://x-lance.github.io/members/faculty/ https://x-lance.github.io/_pages/en/members/ https://x-lance.github.io/news/ https://x-lance.github.io/papers/ https://x-lance.github.io/projects/ https://x-lance.github.io/repositories/ https://x-lance.github.io/members/student/ https://x-lance.github.io/teaching/ https://x-lance.github.io/_pages/en/under_construction/ https://x-lance.github.io/blog/tag/formatting/ https://x-lance.github.io/blog/tag/links/ https://x-lance.github.io/blog/tag/images/ https://x-lance.github.io/blog/tag/code/ 
https://x-lance.github.io/blog/tag/math/ https://x-lance.github.io/blog/tag/comments/ https://x-lance.github.io/blog/tag/distill/ https://x-lance.github.io/blog/tag/metadata/ https://x-lance.github.io/blog/tag/diagrams/ https://x-lance.github.io/blog/tag/toc/ https://x-lance.github.io/blog/tag/tables/ https://x-lance.github.io/blog/tag/videos/ https://x-lance.github.io/blog/tag/audios/ https://x-lance.github.io/blog/tag/sidebar/ https://x-lance.github.io/blog/tag/blockquotes/ https://x-lance.github.io/blog/tag/jupyter/ https://x-lance.github.io/blog/tag/bib/ https://x-lance.github.io/blog/tag/charts/ https://x-lance.github.io/blog/tag/maps/ https://x-lance.github.io/blog/category/sample-posts/ https://x-lance.github.io/blog/category/external-services/ https://x-lance.github.io/blog/2015/ https://x-lance.github.io/blog/2018/ https://x-lance.github.io/blog/2020/ https://x-lance.github.io/blog/2021/ https://x-lance.github.io/blog/2022/ https://x-lance.github.io/blog/2023/ https://x-lance.github.io/blog/2024/ https://x-lance.github.io/blog/ https://x-lance.github.io/blog/page/2/ https://x-lance.github.io/blog/page/3/ https://x-lance.github.io/blog/page/4/ https://x-lance.github.io/blog/page/5/ https://x-lance.github.io/blog/page/6/ \ No newline at end of file + https://x-lance.github.io/news/announcement_1/ 2023-12-31T00:00:00+00:00 https://x-lance.github.io/news/announcement_2/ 2023-12-31T00:00:00+00:00 https://x-lance.github.io/news/announcement_5/ 2024-01-24T00:00:00+00:00 https://x-lance.github.io/news/announcement_3/ 2024-02-29T00:00:00+00:00 https://x-lance.github.io/news/announcement_4/ 2024-03-14T00:00:00+00:00 https://x-lance.github.io/news/announcement_6/ 2024-04-07T00:00:00+00:00 https://x-lance.github.io/news/announcement_7/ 2024-05-02T00:00:00+00:00 https://x-lance.github.io/news/announcement_8/ 2024-05-16T00:00:00+00:00 https://x-lance.github.io/news/announcement_9/ 2024-05-18T00:00:00+00:00 https://x-lance.github.io/blog/2015/formatting-and-links/ 
2015-03-15T16:40:16+00:00 https://x-lance.github.io/blog/2015/images/ 2015-05-15T21:01:00+00:00 https://x-lance.github.io/blog/2015/code/ 2015-07-15T15:09:00+00:00 https://x-lance.github.io/blog/2015/math/ 2015-10-20T15:12:00+00:00 https://x-lance.github.io/blog/2015/disqus-comments/ 2015-10-20T15:59:00+00:00 https://x-lance.github.io/blog/2018/distill/ 2018-12-22T00:00:00+00:00 https://x-lance.github.io/blog/2020/twitter/ 2020-09-28T15:12:00+00:00 https://x-lance.github.io/blog/2020/github-metadata/ 2020-09-28T21:01:00+00:00 https://x-lance.github.io/blog/2021/diagrams/ 2021-07-04T17:39:00+00:00 https://x-lance.github.io/blog/2022/redirect/ 2022-02-01T17:39:00+00:00 https://x-lance.github.io/blog/2022/giscus-comments/ 2022-12-10T15:59:00+00:00 https://x-lance.github.io/blog/2023/table-of-contents/ 2023-03-20T15:59:00+00:00 https://x-lance.github.io/blog/2023/tables/ 2023-03-20T18:37:00+00:00 https://x-lance.github.io/blog/2023/videos/ 2023-04-24T21:01:00+00:00 https://x-lance.github.io/blog/2023/audios/ 2023-04-25T10:25:00+00:00 https://x-lance.github.io/blog/2023/sidebar-table-of-contents/ 2023-04-25T14:14:00+00:00 https://x-lance.github.io/blog/2023/custom-blockquotes/ 2023-05-12T19:53:00+00:00 https://x-lance.github.io/blog/2023/jupyter-notebook/ 2023-07-04T12:57:00+00:00 https://x-lance.github.io/blog/2023/post-bibliography/ 2023-07-12T13:56:00+00:00 https://x-lance.github.io/blog/2023/tikzjax/ 2023-12-12T22:25:00+00:00 https://x-lance.github.io/blog/2024/chartjs/ 2024-01-26T01:04:00+00:00 https://x-lance.github.io/blog/2024/echarts/ 2024-01-26T16:03:00+00:00 https://x-lance.github.io/blog/2024/geojson-map/ 2024-01-26T17:57:00+00:00 https://x-lance.github.io/blog/2024/vega-lite/ 2024-01-27T00:20:00+00:00 https://x-lance.github.io/blog/2024/advanced-images/ 2024-01-27T11:46:00+00:00 https://x-lance.github.io/blog/2024/code-diff/ 2024-01-27T19:22:00+00:00 https://x-lance.github.io/blog/2022/displaying-external-posts-on-your-al-folio-blog/ 
2022-04-23T23:20:09+00:00 https://x-lance.github.io/projects/1_project/ 2024-05-26T02:54:38+00:00 https://x-lance.github.io/projects/2_project/ 2024-05-26T02:54:38+00:00 https://x-lance.github.io/projects/3_project/ 2024-05-26T02:54:38+00:00 https://x-lance.github.io/projects/4_project/ 2024-05-26T02:54:38+00:00 https://x-lance.github.io/projects/5_project/ 2024-05-26T02:54:38+00:00 https://x-lance.github.io/projects/6_project/ 2024-05-26T02:54:38+00:00 https://x-lance.github.io/ https://x-lance.github.io/members/alumni/ https://x-lance.github.io/cv/ https://x-lance.github.io/members/faculty/ https://x-lance.github.io/_pages/en/members/ https://x-lance.github.io/news/ https://x-lance.github.io/papers/ https://x-lance.github.io/projects/ https://x-lance.github.io/repositories/ https://x-lance.github.io/members/student/ https://x-lance.github.io/teaching/ https://x-lance.github.io/_pages/en/under_construction/ https://x-lance.github.io/blog/tag/formatting/ https://x-lance.github.io/blog/tag/links/ https://x-lance.github.io/blog/tag/images/ https://x-lance.github.io/blog/tag/code/ https://x-lance.github.io/blog/tag/math/ https://x-lance.github.io/blog/tag/comments/ https://x-lance.github.io/blog/tag/distill/ https://x-lance.github.io/blog/tag/metadata/ https://x-lance.github.io/blog/tag/diagrams/ https://x-lance.github.io/blog/tag/toc/ https://x-lance.github.io/blog/tag/tables/ https://x-lance.github.io/blog/tag/videos/ https://x-lance.github.io/blog/tag/audios/ https://x-lance.github.io/blog/tag/sidebar/ https://x-lance.github.io/blog/tag/blockquotes/ https://x-lance.github.io/blog/tag/jupyter/ https://x-lance.github.io/blog/tag/bib/ https://x-lance.github.io/blog/tag/charts/ https://x-lance.github.io/blog/tag/maps/ https://x-lance.github.io/blog/category/sample-posts/ https://x-lance.github.io/blog/category/external-services/ https://x-lance.github.io/blog/2015/ https://x-lance.github.io/blog/2018/ https://x-lance.github.io/blog/2020/ 
https://x-lance.github.io/blog/2021/ https://x-lance.github.io/blog/2022/ https://x-lance.github.io/blog/2023/ https://x-lance.github.io/blog/2024/ https://x-lance.github.io/blog/ https://x-lance.github.io/blog/page/2/ https://x-lance.github.io/blog/page/3/ https://x-lance.github.io/blog/page/4/ https://x-lance.github.io/blog/page/5/ https://x-lance.github.io/blog/page/6/ \ No newline at end of file diff --git a/teaching/index.html b/teaching/index.html index 0a828234c10d..f13d7de53e92 100644 --- a/teaching/index.html +++ b/teaching/index.html @@ -1 +1 @@ - Teaching | X - LANCE

Teaching

Courses offered by X-LANCE

Spring 2024

  • Intelligent Speech Technology [AI2304 AI2651] Kai Yu, Yanmin Qian

Fall 2023

  • Lectures on Frontiers of Artificial Intelligence [AI3605] Kai Yu
  • Natural Language Processing [CS3602 CS4314] Kai Yu, Lu Chen, Rui Wang
  • Computer Networks [ICE4407P] Liping Shen
  • Computer Networks (D) [CS3311] Liping Shen, Na Ruan
  • Discrete Mathematics [CS2501] Liping Shen
  • Academic Writing, Norms, and Ethics [GE6001] Mengyue Wu

Spring 2023

  • Intelligent Speech Technology [AI2304 AI2651] Kai Yu, Yanmin Qian
  • Knowledge Representation and Reasoning [AI3612] Lu Chen

Fall 2022

  • Lectures on Frontiers of Artificial Intelligence [AI3605] Kai Yu
  • Natural Language Processing [CS3602 CS4314] Kai Yu, Lu Chen, Rui Wang
  • Discrete Mathematics [CS2501] Liping Shen
  • Programming Design and Methodology (C++) [CS1501] Xie Chen
  • Academic Writing, Norms, and Ethics [GE6001] Mengyue Wu

Spring 2022

  • Intelligent Speech Technology [AI2304 AI2651] Kai Yu, Yanmin Qian
  • Knowledge Representation and Reasoning [AI3612] Lu Chen
  • Intelligent Perception and Cognition Practice [AI3611] Mengyue Wu, Xie Chen

Fall 2021

  • Lectures on Frontiers of Artificial Intelligence [AI3605] Kai Yu
  • Natural Language Processing [CS3602 CS4314] Kai Yu, Lu Chen, Rui Wang
  • Computer Networks (D) [CS3311] Liping Shen, Na Ruan
  • Discrete Mathematics [CS2501] Liping Shen

Spring 2021

  • Intelligent Speech Technology [AI2304 AI2651] Kai Yu, Yanmin Qian

Fall 2020

  • Programming Design and Methodology (C++) [CS1501] Liping Shen

Unclassified or Earlier

  • Computer Organization and Architecture [ICE4406P] Liping Shen, Shizhen Zhao
  • Computer Ethics [CS3309] Mengyue Wu
© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file + Teaching | X - LANCE

Teaching

Courses offered by X-LANCE

Spring 2024

  • Intelligent Speech Technology [AI2304 AI2651] Kai Yu, Yanmin Qian

Fall 2023

  • Lectures on Frontiers of Artificial Intelligence [AI3605] Kai Yu
  • Natural Language Processing [CS3602 CS4314] Kai Yu, Lu Chen, Rui Wang
  • Computer Networks [ICE4407P] Liping Shen
  • Computer Networks (D) [CS3311] Liping Shen, Na Ruan
  • Discrete Mathematics [CS2501] Liping Shen
  • Academic Writing, Norms, and Ethics [GE6001] Mengyue Wu

Spring 2023

  • Intelligent Speech Technology [AI2304 AI2651] Kai Yu, Yanmin Qian
  • Knowledge Representation and Reasoning [AI3612] Lu Chen

Fall 2022

  • Lectures on Frontiers of Artificial Intelligence [AI3605] Kai Yu
  • Natural Language Processing [CS3602 CS4314] Kai Yu, Lu Chen, Rui Wang
  • Discrete Mathematics [CS2501] Liping Shen
  • Programming Design and Methodology (C++) [CS1501] Xie Chen
  • Academic Writing, Norms, and Ethics [GE6001] Mengyue Wu

Spring 2022

  • Intelligent Speech Technology [AI2304 AI2651] Kai Yu, Yanmin Qian
  • Knowledge Representation and Reasoning [AI3612] Lu Chen
  • Intelligent Perception and Cognition Practice [AI3611] Mengyue Wu, Xie Chen

Fall 2021

  • Lectures on Frontiers of Artificial Intelligence [AI3605] Kai Yu
  • Natural Language Processing [CS3602 CS4314] Kai Yu, Lu Chen, Rui Wang
  • Computer Networks (D) [CS3311] Liping Shen, Na Ruan
  • Discrete Mathematics [CS2501] Liping Shen

Spring 2021

  • Intelligent Speech Technology [AI2304 AI2651] Kai Yu, Yanmin Qian

Fall 2020

  • Programming Design and Methodology (C++) [CS1501] Liping Shen

Unclassified or Earlier

  • Computer Organization and Architecture [ICE4406P] Liping Shen, Shizhen Zhao
  • Computer Ethics [CS3309] Mengyue Wu
© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file diff --git a/zh/404.html b/zh/404.html index 0dad2f09ce57..13ca7e504dc1 100644 --- a/zh/404.html +++ b/zh/404.html @@ -1 +1 @@ - 没有找到页面 | X - LANCE

没有找到页面

看起来出现了问题。这里什么都没有。

您将在 3 秒内被重定向到主页。如果未重定向,请返回 主页

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file + 没有找到页面 | X - LANCE

没有找到页面

看起来出现了问题。这里什么都没有。

您将在 3 秒内被重定向到主页。如果未重定向,请返回 主页

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file diff --git a/zh/_pages/zh/members/index.html b/zh/_pages/zh/members/index.html index ea126d4703fe..ffb587e082ac 100644 --- a/zh/_pages/zh/members/index.html +++ b/zh/_pages/zh/members/index.html @@ -1 +1 @@ - 🙌成员 | X - LANCE

🙌成员

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file + 🙌成员 | X - LANCE

🙌成员

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file diff --git a/zh/_pages/zh/under_construction/index.html b/zh/_pages/zh/under_construction/index.html index 4a4b765f5692..219ad9e773d2 100644 --- a/zh/_pages/zh/under_construction/index.html +++ b/zh/_pages/zh/under_construction/index.html @@ -1 +1 @@ - 🛠️搭建中 | X - LANCE

🛠️搭建中

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file + 🛠️搭建中 | X - LANCE

🛠️搭建中

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file diff --git a/zh/blog/2015/code/index.html b/zh/blog/2015/code/index.html index 75237e54e085..7311a4085248 100644 --- a/zh/blog/2015/code/index.html +++ b/zh/blog/2015/code/index.html @@ -1,4 +1,4 @@ - a post with code | X - LANCE

a post with code

This theme implements a built-in Jekyll feature, the use of Rouge, for syntax highlighting. It supports more than 100 languages. This example is in C++. All you have to do is wrap your code in markdown code tags:

```c++
+        a post with code | X - LANCE                  

a post with code

This theme implements a built-in Jekyll feature, the use of Rouge, for syntax highlighting. It supports more than 100 languages. This example is in C++. All you have to do is wrap your code in markdown code tags:

```c++
 code code code
 ```
 
int main(int argc, char const \*argv[])
diff --git a/zh/blog/2015/disqus-comments/index.html b/zh/blog/2015/disqus-comments/index.html
index 805585dffa2a..bcbce1ded7b9 100644
--- a/zh/blog/2015/disqus-comments/index.html
+++ b/zh/blog/2015/disqus-comments/index.html
@@ -1 +1 @@
-        a post with disqus comments | X - LANCE                  

a post with disqus comments

This post shows how to add DISQUS comments.

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file + a post with disqus comments | X - LANCE

a post with disqus comments

This post shows how to add DISQUS comments.

© Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
\ No newline at end of file diff --git a/zh/blog/2015/formatting-and-links/index.html b/zh/blog/2015/formatting-and-links/index.html index 0c9eac616625..e3c4894b95f4 100644 --- a/zh/blog/2015/formatting-and-links/index.html +++ b/zh/blog/2015/formatting-and-links/index.html @@ -1 +1 @@ - a post with formatting and links | X - LANCE

a post with formatting and links

Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

Hipster list

  • brunch
  • fixie
  • raybans
  • messenger bag

Check List

  • Brush Teeth
  • Put on socks
    • Put on left sock
    • Put on right sock
  • Go to school

Hoodie Thundercats retro, tote bag 8-bit Godard craft beer gastropub. Truffaut Tumblr taxidermy, raw denim Kickstarter sartorial dreamcatcher. Quinoa chambray slow-carb salvia readymade, bicycle rights 90’s yr typewriter selfies letterpress cardigan vegan.


Pug heirloom High Life vinyl swag, single-origin coffee four dollar toast taxidermy reprehenderit fap distillery master cleanse locavore. Est anim sapiente leggings Brooklyn ea. Thundercats locavore excepteur veniam eiusmod. Raw denim Truffaut Schlitz, migas sapiente Portland VHS twee Bushwick Marfa typewriter retro id keytar.

We do not grow absolutely, chronologically. We grow sometimes in one dimension, and not in another, unevenly. We grow partially. We are relative. We are mature in one realm, childish in another. —Anais Nin

Fap aliqua qui, scenester pug Echo Park polaroid irony shabby chic ex cardigan church-key Odd Future accusamus. Blog stumptown sartorial squid, gastropub duis aesthetic Truffaut vero. Pinterest tilde twee, odio mumblecore jean shorts lumbersexual.




    喜欢阅读这篇文章吗?

    这里有一些您可能喜欢的下一篇文章:

  • a post with formatting and links
  • a post with table of contents
  • a post with table of contents on a sidebar
  • a distill-style blog post
  • displaying beautiful tables with Bootstrap Tables
  • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
    \ No newline at end of file + a post with formatting and links | X - LANCE

    a post with formatting and links

    Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

    Hipster list

    • brunch
    • fixie
    • raybans
    • messenger bag

    Check List

    • Brush Teeth
    • Put on socks
      • Put on left sock
      • Put on right sock
    • Go to school

    Hoodie Thundercats retro, tote bag 8-bit Godard craft beer gastropub. Truffaut Tumblr taxidermy, raw denim Kickstarter sartorial dreamcatcher. Quinoa chambray slow-carb salvia readymade, bicycle rights 90’s yr typewriter selfies letterpress cardigan vegan.


    Pug heirloom High Life vinyl swag, single-origin coffee four dollar toast taxidermy reprehenderit fap distillery master cleanse locavore. Est anim sapiente leggings Brooklyn ea. Thundercats locavore excepteur veniam eiusmod. Raw denim Truffaut Schlitz, migas sapiente Portland VHS twee Bushwick Marfa typewriter retro id keytar.

    We do not grow absolutely, chronologically. We grow sometimes in one dimension, and not in another, unevenly. We grow partially. We are relative. We are mature in one realm, childish in another. —Anais Nin

    Fap aliqua qui, scenester pug Echo Park polaroid irony shabby chic ex cardigan church-key Odd Future accusamus. Blog stumptown sartorial squid, gastropub duis aesthetic Truffaut vero. Pinterest tilde twee, odio mumblecore jean shorts lumbersexual.




      喜欢阅读这篇文章吗?

      这里有一些您可能喜欢的下一篇文章:

    • a post with formatting and links
    • a post with table of contents
    • a post with table of contents on a sidebar
    • a distill-style blog post
    • displaying beautiful tables with Bootstrap Tables
    • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
      \ No newline at end of file diff --git a/zh/blog/2015/images/index.html b/zh/blog/2015/images/index.html index 6f9e734457f8..f33280c8e153 100644 --- a/zh/blog/2015/images/index.html +++ b/zh/blog/2015/images/index.html @@ -1 +1 @@ - a post with images | X - LANCE

      a post with images

      This is an example post with image galleries.

      A simple, elegant caption looks good between image rows, after each row, or doesn't have to be there at all.

      Images can be made zoomable. Simply add data-zoomable to <img> tags that you want to make zoomable.

      The rest of the images in this post are all zoomable, arranged into different mini-galleries.




        喜欢阅读这篇文章吗?

        这里有一些您可能喜欢的下一篇文章:

      • a post with images
      • a post with videos
      • a post with audios
      • a post with advanced image components
      • a distill-style blog post
      • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
        \ No newline at end of file + a post with images | X - LANCE

        a post with images

        This is an example post with image galleries.

        A simple, elegant caption looks good between image rows, after each row, or doesn't have to be there at all.

        Images can be made zoomable. Simply add data-zoomable to <img> tags that you want to make zoomable.

        The rest of the images in this post are all zoomable, arranged into different mini-galleries.




          喜欢阅读这篇文章吗?

          这里有一些您可能喜欢的下一篇文章:

        • a post with images
        • a post with videos
        • a post with audios
        • a post with advanced image components
        • a distill-style blog post
        • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
          \ No newline at end of file diff --git a/zh/blog/2015/index.html b/zh/blog/2015/index.html index b928a0630c15..f9062f3b59d1 100644 --- a/zh/blog/2015/index.html +++ b/zh/blog/2015/index.html @@ -1 +1 @@ - 2015 | X - LANCE

          2015

          该年份的文章存档

          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
          \ No newline at end of file + 2015 | X - LANCE

          2015

          该年份的文章存档

          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
          \ No newline at end of file diff --git a/zh/blog/2015/math/index.html b/zh/blog/2015/math/index.html index ea38fda5e9a3..d689fca18443 100644 --- a/zh/blog/2015/math/index.html +++ b/zh/blog/2015/math/index.html @@ -1 +1 @@ - a post with math | X - LANCE

          a post with math

          This theme supports rendering beautiful math in inline and display modes using MathJax 3 engine. You just need to surround your math expression with $$, like $$ E = mc^2 $$. If you leave it inside a paragraph, it will produce an inline expression, just like \(E = mc^2\).

          To use display mode, again surround your expression with $$ and place it as a separate paragraph. Here is an example:

          \[\sum_{k=1}^\infty |\langle x, e_k \rangle|^2 \leq \|x\|^2\]

          You can also use \begin{equation}...\end{equation} instead of $$ for display mode math. MathJax will automatically number equations:

          \begin{equation} \label{eq:cauchy-schwarz} \left( \sum_{k=1}^n a_k b_k \right)^2 \leq \left( \sum_{k=1}^n a_k^2 \right) \left( \sum_{k=1}^n b_k^2 \right) \end{equation}

          and by adding \label{...} inside the equation environment, we can now refer to the equation using \eqref.

          Note that MathJax 3 is a major re-write of MathJax that brought a significant improvement to the loading and rendering speed, which is now on par with KaTeX.

          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
          \ No newline at end of file + a post with math | X - LANCE

          a post with math

          This theme supports rendering beautiful math in inline and display modes using MathJax 3 engine. You just need to surround your math expression with $$, like $$ E = mc^2 $$. If you leave it inside a paragraph, it will produce an inline expression, just like \(E = mc^2\).

          To use display mode, again surround your expression with $$ and place it as a separate paragraph. Here is an example:

          \[\sum_{k=1}^\infty |\langle x, e_k \rangle|^2 \leq \|x\|^2\]

          You can also use \begin{equation}...\end{equation} instead of $$ for display mode math. MathJax will automatically number equations:

          \begin{equation} \label{eq:cauchy-schwarz} \left( \sum_{k=1}^n a_k b_k \right)^2 \leq \left( \sum_{k=1}^n a_k^2 \right) \left( \sum_{k=1}^n b_k^2 \right) \end{equation}

          and by adding \label{...} inside the equation environment, we can now refer to the equation using \eqref.

          Note that MathJax 3 is a major re-write of MathJax that brought a significant improvement to the loading and rendering speed, which is now on par with KaTeX.

          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
          \ No newline at end of file diff --git a/zh/blog/2018/distill/index.html b/zh/blog/2018/distill/index.html index 7a53373be24b..a4475c49e477 100644 --- a/zh/blog/2018/distill/index.html +++ b/zh/blog/2018/distill/index.html @@ -54,7 +54,7 @@ ] } } -

          a distill-style blog post

          an example of a distill-style blog post and main elements

          Equations

          This theme supports rendering beautiful math in inline and display modes using MathJax 3 engine. You just need to surround your math expression with $$, like $$ E = mc^2 $$. If you leave it inside a paragraph, it will produce an inline expression, just like \(E = mc^2\).

          To use display mode, again surround your expression with $$ and place it as a separate paragraph. Here is an example:

          \[\left( \sum_{k=1}^n a_k b_k \right)^2 \leq \left( \sum_{k=1}^n a_k^2 \right) \left( \sum_{k=1}^n b_k^2 \right)\]

          Note that MathJax 3 is a major re-write of MathJax that brought a significant improvement to the loading and rendering speed, which is now on par with KaTeX.


          Citations

          Citations are then used in the article body with the <d-cite> tag. The key attribute is a reference to the id provided in the bibliography. The key attribute can take multiple ids, separated by commas.

          The citation is presented inline like this: (a number that displays more information on hover). If you have an appendix, a bibliography is automatically created and populated in it.

          Distill chose a numerical inline citation style to improve readability of citation dense articles and because many of the benefits of longer citations are obviated by displaying more information on hover. However, we consider it good style to mention author last names if you discuss something at length and it fits into the flow well — the authors are human and it’s nice for them to have the community associate them with their work.


          Footnotes

          Just wrap the text you would like to show up in a footnote in a <d-footnote> tag. The number of the footnote will be automatically generated.This will become a hoverable footnote.


          Code Blocks

          Syntax highlighting is provided within <d-code> tags. An example of inline code snippets: <d-code language="html">let x = 10;</d-code>. For larger blocks of code, add a block attribute:

          var x = 25; function(x) { return x * x; }

          Note: <d-code> blocks do not look good in the dark mode. You can always use the default code-highlight using the highlight liquid tag:

          var x = 25;
          +      

          a distill-style blog post

          an example of a distill-style blog post and main elements

          Equations

          This theme supports rendering beautiful math in inline and display modes using MathJax 3 engine. You just need to surround your math expression with $$, like $$ E = mc^2 $$. If you leave it inside a paragraph, it will produce an inline expression, just like \(E = mc^2\).

          To use display mode, again surround your expression with $$ and place it as a separate paragraph. Here is an example:

          \[\left( \sum_{k=1}^n a_k b_k \right)^2 \leq \left( \sum_{k=1}^n a_k^2 \right) \left( \sum_{k=1}^n b_k^2 \right)\]

          Note that MathJax 3 is a major re-write of MathJax that brought a significant improvement to the loading and rendering speed, which is now on par with KaTeX.


          Citations

          Citations are then used in the article body with the <d-cite> tag. The key attribute is a reference to the id provided in the bibliography. The key attribute can take multiple ids, separated by commas.

          The citation is presented inline like this: (a number that displays more information on hover). If you have an appendix, a bibliography is automatically created and populated in it.

          Distill chose a numerical inline citation style to improve readability of citation dense articles and because many of the benefits of longer citations are obviated by displaying more information on hover. However, we consider it good style to mention author last names if you discuss something at length and it fits into the flow well — the authors are human and it’s nice for them to have the community associate them with their work.


          Footnotes

          Just wrap the text you would like to show up in a footnote in a <d-footnote> tag. The number of the footnote will be automatically generated.This will become a hoverable footnote.


          Code Blocks

          Syntax highlighting is provided within <d-code> tags. An example of inline code snippets: <d-code language="html">let x = 10;</d-code>. For larger blocks of code, add a block attribute:

          var x = 25; function(x) { return x * x; }

          Note: <d-code> blocks do not look good in the dark mode. You can always use the default code-highlight using the highlight liquid tag:

          var x = 25;
           function(x) {
           return x \* x;
           }

          Interactive Plots

          You can add interactive plots using plotly + iframes :framed_picture:

          The plot must be generated separately and saved into an HTML file. To generate the plot that you see above, you can use the following code snippet:

          import pandas as pd
          diff --git a/zh/blog/2018/index.html b/zh/blog/2018/index.html
          index ebc92665931f..ab31c4128c13 100644
          --- a/zh/blog/2018/index.html
          +++ b/zh/blog/2018/index.html
          @@ -1 +1 @@
          -        2018 | X - LANCE                  

          2018

          该年份的文章存档

          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
          \ No newline at end of file + 2018 | X - LANCE

          2018

          该年份的文章存档

          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
          \ No newline at end of file diff --git a/zh/blog/2020/github-metadata/index.html b/zh/blog/2020/github-metadata/index.html index 617807b14602..474739e590c3 100644 --- a/zh/blog/2020/github-metadata/index.html +++ b/zh/blog/2020/github-metadata/index.html @@ -1 +1 @@ - a post with github metadata | X - LANCE

          a post with github metadata

          A sample blog page that demonstrates the accessing of github meta data.

          What does Github-MetaData do?

          • Propagates the site.github namespace with repository metadata
          • Setting site variables :
            • site.title
            • site.description
            • site.url
            • site.baseurl
          • Accessing the metadata - duh.
          • Generating editable links.

          Additional Reading

          • If you’re receiving incorrect/missing data, you may need to perform a Github API authentication.
          • Go through this README for more details on the topic.
          • This page highlights all the fields you can access with github-metadata.

          Example MetaData

          • Host Name :
          • URL :
          • BaseURL :
          • Archived :
          • Contributors :



            喜欢阅读这篇文章吗?

            这里有一些您可能喜欢的下一篇文章:

          • a post with github metadata
          • a post with twitter
          • a distill-style blog post
          • a post with code
          • a post with jupyter notebook
          • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
            \ No newline at end of file + a post with github metadata | X - LANCE

            a post with github metadata

            A sample blog page that demonstrates the accessing of github meta data.

            What does Github-MetaData do?

            • Propagates the site.github namespace with repository metadata
            • Setting site variables :
              • site.title
              • site.description
              • site.url
              • site.baseurl
            • Accessing the metadata - duh.
            • Generating editable links.

            Additional Reading

            • If you’re receiving incorrect/missing data, you may need to perform a Github API authentication.
            • Go through this README for more details on the topic.
            • This page highlights all the fields you can access with github-metadata.

            Example MetaData

            • Host Name :
            • URL :
            • BaseURL :
            • Archived :
            • Contributors :



              喜欢阅读这篇文章吗?

              这里有一些您可能喜欢的下一篇文章:

            • a post with github metadata
            • a post with twitter
            • a distill-style blog post
            • a post with code
            • a post with jupyter notebook
            • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
              \ No newline at end of file diff --git a/zh/blog/2020/index.html b/zh/blog/2020/index.html index c10c7ee34e7f..05e7dd9c396f 100644 --- a/zh/blog/2020/index.html +++ b/zh/blog/2020/index.html @@ -1 +1 @@ - 2020 | X - LANCE

              2020

              该年份的文章存档

              © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
              \ No newline at end of file + 2020 | X - LANCE

              2020

              该年份的文章存档

              © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
              \ No newline at end of file diff --git a/zh/blog/2020/twitter/index.html b/zh/blog/2020/twitter/index.html index 75c966ea3667..92759509e751 100644 --- a/zh/blog/2020/twitter/index.html +++ b/zh/blog/2020/twitter/index.html @@ -1 +1 @@ - a post with twitter | X - LANCE

              a post with twitter

              A sample blog page that demonstrates the inclusion of Tweets/Timelines/etc.

              Tweet

              An example of displaying a tweet:

              Timeline

              An example of pulling from a timeline:

              Additional Details

              For more details on using the plugin visit: jekyll-twitter-plugin




                喜欢阅读这篇文章吗?

                这里有一些您可能喜欢的下一篇文章:

              • a distill-style blog post
              • a post with videos
              • a post with code
              • a post with github metadata
              • a post with jupyter notebook
              • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                \ No newline at end of file + a post with twitter | X - LANCE

                a post with twitter

                A sample blog page that demonstrates the inclusion of Tweets/Timelines/etc.

                Tweet

                An example of displaying a tweet:

                Timeline

                An example of pulling from a timeline:

                Additional Details

                For more details on using the plugin visit: jekyll-twitter-plugin




                  喜欢阅读这篇文章吗?

                  这里有一些您可能喜欢的下一篇文章:

                • a distill-style blog post
                • a post with videos
                • a post with code
                • a post with github metadata
                • a post with jupyter notebook
                • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                  \ No newline at end of file diff --git a/zh/blog/2021/diagrams/index.html b/zh/blog/2021/diagrams/index.html index 110b4e0b5704..bc4253e087bc 100644 --- a/zh/blog/2021/diagrams/index.html +++ b/zh/blog/2021/diagrams/index.html @@ -1,4 +1,4 @@ - a post with diagrams | X - LANCE

                  a post with diagrams

                  This theme supports generating various diagrams from a text description using mermaid. Previously, this was done using the jekyll-diagrams plugin. For more information on this matter, see the related issue. To disable the zooming feature, set mermaid.zoomable to false in this post frontmatter.

                  Mermaid

                  The diagram below was generated by the following code:

                  ```mermaid
                  +        a post with diagrams | X - LANCE                  

                  a post with diagrams

                  This theme supports generating various diagrams from a text description using mermaid. Previously, this was done using the jekyll-diagrams plugin. For more information on this matter, see the related issue. To disable the zooming feature, set mermaid.zoomable to false in this post frontmatter.

                  Mermaid

                  The diagram below was generated by the following code:

                  ```mermaid
                   sequenceDiagram
                       participant John
                       participant Alice
                  diff --git a/zh/blog/2021/index.html b/zh/blog/2021/index.html
                  index 3882dcac1d65..9a61751ea357 100644
                  --- a/zh/blog/2021/index.html
                  +++ b/zh/blog/2021/index.html
                  @@ -1 +1 @@
                  -        2021 | X - LANCE                  

                  2021

                  该年份的文章存档

                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                  \ No newline at end of file + 2021 | X - LANCE

                  2021

                  该年份的文章存档

                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                  \ No newline at end of file diff --git a/zh/blog/2022/giscus-comments/index.html b/zh/blog/2022/giscus-comments/index.html index 6348f1aa1803..da12f88f568e 100644 --- a/zh/blog/2022/giscus-comments/index.html +++ b/zh/blog/2022/giscus-comments/index.html @@ -1 +1 @@ - a post with giscus comments | X - LANCE

                  a post with giscus comments

                  This post shows how to add GISCUS comments.

                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                  \ No newline at end of file + a post with giscus comments | X - LANCE

                  a post with giscus comments

                  This post shows how to add GISCUS comments.

                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                  \ No newline at end of file diff --git a/zh/blog/2022/index.html b/zh/blog/2022/index.html index 96baa9f3440a..bc7b2deeb04f 100644 --- a/zh/blog/2022/index.html +++ b/zh/blog/2022/index.html @@ -1 +1 @@ - 2022 | X - LANCE

                  2022

                  该年份的文章存档

                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                  \ No newline at end of file + 2022 | X - LANCE

                  2022

                  该年份的文章存档

                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                  \ No newline at end of file diff --git a/zh/blog/2022/redirect/index.html b/zh/blog/2022/redirect/index.html index ab9576ed5859..3ee227a5f462 100644 --- a/zh/blog/2022/redirect/index.html +++ b/zh/blog/2022/redirect/index.html @@ -1 +1 @@ - a post with redirect | X - LANCE

                  a post with redirect

                  Redirecting to another page or file. Note that pages without any text, with very short texts or formed only by words without much meaning can cause problems for the generation of related posts.




                    喜欢阅读这篇文章吗?

                    这里有一些您可能喜欢的下一篇文章:

                  • a distill-style blog post
                  • a post with echarts
                  • a post with code diff
                  • a post with jupyter notebook
                  • a post with diagrams
                  • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                    \ No newline at end of file + a post with redirect | X - LANCE

                    a post with redirect

                    Redirecting to another page or file. Note that pages without any text, with very short texts or formed only by words without much meaning can cause problems for the generation of related posts.




                      喜欢阅读这篇文章吗?

                      这里有一些您可能喜欢的下一篇文章:

                    • a distill-style blog post
                    • a post with echarts
                    • a post with code diff
                    • a post with jupyter notebook
                    • a post with diagrams
                    • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                      \ No newline at end of file diff --git a/zh/blog/2023/audios/index.html b/zh/blog/2023/audios/index.html index 5302b2d2841e..f8ff104c2d6b 100644 --- a/zh/blog/2023/audios/index.html +++ b/zh/blog/2023/audios/index.html @@ -1 +1 @@ - a post with audios | X - LANCE

                      a post with audios

                      This is an example post with audios. It supports local audio files.

                      A simple, elegant caption looks good between video rows, after each row, or doesn't have to be there at all.



                        喜欢阅读这篇文章吗?

                        这里有一些您可能喜欢的下一篇文章:

                      • a post with videos
                      • a post with images
                      • a post with audios
                      • a distill-style blog post
                      • a post with bibliography
                      • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                        \ No newline at end of file + a post with audios | X - LANCE

                        a post with audios

                        This is an example post with audios. It supports local audio files.

                        A simple, elegant caption looks good between video rows, after each row, or doesn't have to be there at all.



                          喜欢阅读这篇文章吗?

                          这里有一些您可能喜欢的下一篇文章:

                        • a post with videos
                        • a post with images
                        • a post with audios
                        • a distill-style blog post
                        • a post with bibliography
                        • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                          \ No newline at end of file diff --git a/zh/blog/2023/custom-blockquotes/index.html b/zh/blog/2023/custom-blockquotes/index.html index e23268470fb0..07c33a2edbb2 100644 --- a/zh/blog/2023/custom-blockquotes/index.html +++ b/zh/blog/2023/custom-blockquotes/index.html @@ -1,4 +1,4 @@ - a post with custom blockquotes | X - LANCE

                          a post with custom blockquotes

                          This post shows how to add custom styles for blockquotes. Based on jekyll-gitbook implementation.

                          We decided to support the same custom blockquotes as in jekyll-gitbook, which are also found in a lot of other sites’ styles. The styles definitions can be found on the _base.scss file, more specifically:

                          /* Tips, warnings, and dangers */
                          +        a post with custom blockquotes | X - LANCE                  

                          a post with custom blockquotes

                          This post shows how to add custom styles for blockquotes. Based on jekyll-gitbook implementation.

                          We decided to support the same custom blockquotes as in jekyll-gitbook, which are also found in a lot of other sites’ styles. The styles definitions can be found on the _base.scss file, more specifically:

                          /* Tips, warnings, and dangers */
                           .post .post-content blockquote {
                             &.block-tip {
                               border-color: var(--global-tip-block);
                          diff --git a/zh/blog/2023/index.html b/zh/blog/2023/index.html
                          index 354e27559a9c..fe8dcb0ddf0f 100644
                          --- a/zh/blog/2023/index.html
                          +++ b/zh/blog/2023/index.html
                          @@ -1 +1 @@
                          -        2023 | X - LANCE                  

                          2023

                          该年份的文章存档

                          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                          \ No newline at end of file + 2023 | X - LANCE

                          2023

                          该年份的文章存档

                          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                          \ No newline at end of file diff --git a/zh/blog/2023/jupyter-notebook/index.html b/zh/blog/2023/jupyter-notebook/index.html index 01ca4de7386c..66084ce3a758 100644 --- a/zh/blog/2023/jupyter-notebook/index.html +++ b/zh/blog/2023/jupyter-notebook/index.html @@ -1,4 +1,4 @@ - a post with jupyter notebook | X - LANCE

                          a post with jupyter notebook

                          To include a jupyter notebook in a post, you can use the following code:

                          {::nomarkdown}
                          +        a post with jupyter notebook | X - LANCE                  

                          a post with jupyter notebook

                          To include a jupyter notebook in a post, you can use the following code:

                          {::nomarkdown}
                           {% assign jupyter_path = 'assets/jupyter/blog.ipynb' | relative_url %}
                           {% capture notebook_exists %}{% file_exists assets/jupyter/blog.ipynb %}{% endcapture %}
                           {% if notebook_exists == 'true' %}
                          diff --git a/zh/blog/2023/post-bibliography/index.html b/zh/blog/2023/post-bibliography/index.html
                          index 51918d885390..75acf5451c18 100644
                          --- a/zh/blog/2023/post-bibliography/index.html
                          +++ b/zh/blog/2023/post-bibliography/index.html
                          @@ -1 +1 @@
                          -        a post with bibliography | X - LANCE                  

                          a post with bibliography

                          This post shows how to add bibliography to simple blog posts. We support every citation style that jekyll-scholar does. That means simple citation like (missing reference), multiple citations like (missing reference), long references like (missing reference) or also quotes:

                          Lorem ipsum dolor sit amet, consectetur adipisicing elit,
                          sed do eiusmod tempor.

                          Lorem ipsum dolor sit amet, consectetur adipisicing.

                          (missing reference)

                          If you would like something more academic, check the distill style post.

                          参考文献

                          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                          \ No newline at end of file + a post with bibliography | X - LANCE

                          a post with bibliography

                          This post shows how to add bibliography to simple blog posts. We support every citation style that jekyll-scholar does. That means simple citation like (missing reference), multiple citations like (missing reference), long references like (missing reference) or also quotes:

                          Lorem ipsum dolor sit amet, consectetur adipisicing elit,
                          sed do eiusmod tempor.

                          Lorem ipsum dolor sit amet, consectetur adipisicing.

                          (missing reference)

                          If you would like something more academic, check the distill style post.

                          参考文献

                          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                          \ No newline at end of file diff --git a/zh/blog/2023/sidebar-table-of-contents/index.html b/zh/blog/2023/sidebar-table-of-contents/index.html index f009c842d547..71f134adce06 100644 --- a/zh/blog/2023/sidebar-table-of-contents/index.html +++ b/zh/blog/2023/sidebar-table-of-contents/index.html @@ -1,3 +1,3 @@ - a post with table of contents on a sidebar | X - LANCE

                          a post with table of contents on a sidebar

                          This post shows how to add a table of contents as a sidebar.

                          Adding a Table of Contents

                          To add a table of contents to a post as a sidebar, simply add

                          toc:
                          +        a post with table of contents on a sidebar | X - LANCE                   

                          a post with table of contents on a sidebar

                          This post shows how to add a table of contents as a sidebar.

                          Adding a Table of Contents

                          To add a table of contents to a post as a sidebar, simply add

                          toc:
                             sidebar: left
                           

                          to the front matter of the post. The table of contents will be automatically generated from the headings in the post. If you wish to display the sidebar to the right, simply change left to right.

                          Example of Sub-Heading 1

                          Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

                          Example of another Sub-Heading 1

                          Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

                          Customizing Your Table of Contents

                          If you want to learn more about how to customize the table of contents of your sidebar, you can check the bootstrap-toc documentation. Notice that you can even customize the text of the heading that will be displayed on the sidebar.

                          Example of Sub-Heading 2

                          Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

                          Example of another Sub-Heading 2

                          Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

                          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                          \ No newline at end of file diff --git a/zh/blog/2023/table-of-contents/index.html b/zh/blog/2023/table-of-contents/index.html index 28cd1502b002..a11c82e13e91 100644 --- a/zh/blog/2023/table-of-contents/index.html +++ b/zh/blog/2023/table-of-contents/index.html @@ -1,3 +1,3 @@ - a post with table of contents | X - LANCE

                          a post with table of contents


                          This post shows how to add a table of contents in the beginning of the post.

                          Adding a Table of Contents

                          To add a table of contents to a post, simply add

                          toc:
                          +        a post with table of contents | X - LANCE                  

                          a post with table of contents


                          This post shows how to add a table of contents in the beginning of the post.

                          Adding a Table of Contents

                          To add a table of contents to a post, simply add

                          toc:
                             beginning: true
                           

                          to the front matter of the post. The table of contents will be automatically generated from the headings in the post.

                          Example of Sub-Heading 1

                          Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

                          Example of another Sub-Heading 1

                          Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

                          Table of Contents Options

                          If you want to learn more about how to customize the table of contents, you can check the jekyll-toc repository.

                          Example of Sub-Heading 2

                          Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

                          Example of another Sub-Heading 2

                          Jean shorts raw denim Vice normcore, art party High Life PBR skateboard stumptown vinyl kitsch. Four loko meh 8-bit, tousled banh mi tilde forage Schlitz dreamcatcher twee 3 wolf moon. Chambray asymmetrical paleo salvia, sartorial umami four loko master cleanse drinking vinegar brunch. Pinterest DIY authentic Schlitz, hoodie Intelligentsia butcher trust fund brunch shabby chic Kickstarter forage flexitarian. Direct trade cold-pressed meggings stumptown plaid, pop-up taxidermy. Hoodie XOXO fingerstache scenester Echo Park. Plaid ugh Wes Anderson, freegan pug selvage fanny pack leggings pickled food truck DIY irony Banksy.

                          © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                          \ No newline at end of file diff --git a/zh/blog/2023/tables/index.html b/zh/blog/2023/tables/index.html index ea3d80183f90..0e2923f3bbc2 100644 --- a/zh/blog/2023/tables/index.html +++ b/zh/blog/2023/tables/index.html @@ -1,4 +1,4 @@ - displaying beautiful tables with Bootstrap Tables | X - LANCE

                          displaying beautiful tables with Bootstrap Tables

                          Using markdown to display tables is easy. Just use the following syntax:

                          | Left aligned | Center aligned | Right aligned |
                          +        displaying beautiful tables with Bootstrap Tables | X - LANCE                   

                          displaying beautiful tables with Bootstrap Tables

                          Using markdown to display tables is easy. Just use the following syntax:

                          | Left aligned | Center aligned | Right aligned |
                           | :----------- | :------------: | ------------: |
                           | Left 1       |    center 1    |       right 1 |
                           | Left 2       |    center 2    |       right 2 |
                          diff --git a/zh/blog/2023/tikzjax/index.html b/zh/blog/2023/tikzjax/index.html
                          index 1d6dc21ec3cf..83cd6b94ae2d 100644
                          --- a/zh/blog/2023/tikzjax/index.html
                          +++ b/zh/blog/2023/tikzjax/index.html
                          @@ -1,4 +1,4 @@
                          -        a post with TikZJax | X - LANCE                   

                          a post with TikZJax

                          This is an example post with TikZ code. TikZJax converts script tags (containing TikZ code) into SVGs.

                          a post with TikZJax

                          This is an example post with TikZ code. TikZJax converts script tags (containing TikZ code) into SVGs.

                          a post with videos

                          This is an example post with videos. It supports local video files.

                          A simple, elegant caption looks good between video rows, after each row, or doesn't have to be there at all.

                          It does also support embedding videos from different sources. Here are some examples:




                            喜欢阅读这篇文章吗?

                            这里有一些您可能喜欢的下一篇文章:

                          • a post with images
                          • a post with videos
                          • a post with audios
                          • a post with advanced image components
                          • a distill-style blog post
                          • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                            \ No newline at end of file + a post with videos | X - LANCE

                            a post with videos

                            This is an example post with videos. It supports local video files.

                            A simple, elegant caption looks good between video rows, after each row, or doesn't have to be there at all.

                            It does also support embedding videos from different sources. Here are some examples:




                              喜欢阅读这篇文章吗?

                              这里有一些您可能喜欢的下一篇文章:

                            • a post with images
                            • a post with videos
                            • a post with audios
                            • a post with advanced image components
                            • a distill-style blog post
                            • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                              \ No newline at end of file diff --git a/zh/blog/2024/advanced-images/index.html b/zh/blog/2024/advanced-images/index.html index 37703197d683..4a6a7d6ab041 100644 --- a/zh/blog/2024/advanced-images/index.html +++ b/zh/blog/2024/advanced-images/index.html @@ -1 +1 @@ - a post with advanced image components | X - LANCE

                              a post with advanced image components

                              This is an example post with advanced image components.

                              Image Slider

                              This is a simple image slider. It uses the Swiper library. Check the examples page for more information of what you can achieve with it.

                              Image Comparison Slider

                              This is a simple image comparison slider. It uses the img-comparison-slider library. Check the examples page for more information of what you can achieve with it.




                                喜欢阅读这篇文章吗?

                                这里有一些您可能喜欢的下一篇文章:

                              • a post with advanced image components
                              • a post with images
                              • a distill-style blog post
                              • a post with videos
                              • displaying beautiful tables with Bootstrap Tables
                              • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                \ No newline at end of file + a post with advanced image components | X - LANCE

                                a post with advanced image components

                                This is an example post with advanced image components.

                                Image Slider

                                This is a simple image slider. It uses the Swiper library. Check the examples page for more information of what you can achieve with it.

                                Image Comparison Slider

                                This is a simple image comparison slider. It uses the img-comparison-slider library. Check the examples page for more information of what you can achieve with it.




                                  喜欢阅读这篇文章吗?

                                  这里有一些您可能喜欢的下一篇文章:

                                • a post with advanced image components
                                • a post with images
                                • a distill-style blog post
                                • a post with videos
                                • displaying beautiful tables with Bootstrap Tables
                                • © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/2024/chartjs/index.html b/zh/blog/2024/chartjs/index.html index 85a1b0ee22d5..57284f149953 100644 --- a/zh/blog/2024/chartjs/index.html +++ b/zh/blog/2024/chartjs/index.html @@ -1,4 +1,4 @@ - a post with chart.js | X - LANCE

                                  a post with chart.js

                                  This is an example post with some chart.js code.

                                  ```chartjs
                                  +        a post with chart.js | X - LANCE                  

                                  a post with chart.js

                                  This is an example post with some chart.js code.

                                  ```chartjs
                                   {
                                     "type": "line",
                                     "data": {
                                  diff --git a/zh/blog/2024/code-diff/index.html b/zh/blog/2024/code-diff/index.html
                                  index 15b6b88d741c..e50a09940090 100644
                                  --- a/zh/blog/2024/code-diff/index.html
                                  +++ b/zh/blog/2024/code-diff/index.html
                                  @@ -1,4 +1,4 @@
                                  -        a post with code diff | X - LANCE                     

                                  a post with code diff

                                  You can display diff code by using the regular markdown syntax:

                                  ```diff
                                  +        a post with code diff | X - LANCE                     

                                  a post with code diff

                                  You can display diff code by using the regular markdown syntax:

                                  ```diff
                                   diff --git a/sample.js b/sample.js
                                   index 0000001..0ddf2ba
                                   --- a/sample.js
                                  diff --git a/zh/blog/2024/echarts/index.html b/zh/blog/2024/echarts/index.html
                                  index 6b3670d4d38f..490906dd57e2 100644
                                  --- a/zh/blog/2024/echarts/index.html
                                  +++ b/zh/blog/2024/echarts/index.html
                                  @@ -1,4 +1,4 @@
                                  -        a post with echarts | X - LANCE                  

                                  a post with echarts

                                  This is an example post with some echarts code.

                                  ```echarts
                                  +        a post with echarts | X - LANCE                  

                                  a post with echarts

                                  This is an example post with some echarts code.

                                  ```echarts
                                   {
                                     "title": {
                                       "text": "ECharts Getting Started Example"
                                  diff --git a/zh/blog/2024/geojson-map/index.html b/zh/blog/2024/geojson-map/index.html
                                  index 6c92f5a6b767..52dd8ef919bc 100644
                                  --- a/zh/blog/2024/geojson-map/index.html
                                  +++ b/zh/blog/2024/geojson-map/index.html
                                  @@ -1,4 +1,4 @@
                                  -        a post with geojson | X - LANCE                   

                                  a post with geojson

                                  This is an example post with some geojson code. The support is provided thanks to Leaflet. To create your own visualization, go to geojson.io.

                                  ```geojson
                                  +        a post with geojson | X - LANCE                   

                                  a post with geojson

                                  This is an example post with some geojson code. The support is provided thanks to Leaflet. To create your own visualization, go to geojson.io.

                                  ```geojson
                                   {
                                     "type": "FeatureCollection",
                                     "features": [
                                  diff --git a/zh/blog/2024/index.html b/zh/blog/2024/index.html
                                  index 1fb2f7dc48df..6a0b6e1df977 100644
                                  --- a/zh/blog/2024/index.html
                                  +++ b/zh/blog/2024/index.html
                                  @@ -1 +1 @@
                                  -        2024 | X - LANCE                  

                                  2024

                                  该年份的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + 2024 | X - LANCE

                                  2024

                                  该年份的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/2024/vega-lite/index.html b/zh/blog/2024/vega-lite/index.html index bcc6e5e9a87f..03caba356349 100644 --- a/zh/blog/2024/vega-lite/index.html +++ b/zh/blog/2024/vega-lite/index.html @@ -1,4 +1,4 @@ - a post with vega lite | X - LANCE

                                  a post with vega lite

                                  This is an example post with some vega lite code.

                                  ```vega_lite
                                  +        a post with vega lite | X - LANCE                  

                                  a post with vega lite

                                  This is an example post with some vega lite code.

                                  ```vega_lite
                                   {
                                     "$schema": "https://vega.github.io/schema/vega-lite/v5.json",
                                     "description": "A dot plot showing each movie in the database, and the difference from the average movie rating. The display is sorted by year to visualize everything in sequential order. The graph is for all Movies before 2019.",
                                  diff --git a/zh/blog/category/external-services/index.html b/zh/blog/category/external-services/index.html
                                  index 5be99feae6e5..92a89379fe00 100644
                                  --- a/zh/blog/category/external-services/index.html
                                  +++ b/zh/blog/category/external-services/index.html
                                  @@ -1 +1 @@
                                  -        external-services | X - LANCE                  

                                  external-services

                                  该分类下的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + external-services | X - LANCE

                                  external-services

                                  该分类下的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/category/sample-posts/index.html b/zh/blog/category/sample-posts/index.html index 981c95214fe5..4dd6796dbfdd 100644 --- a/zh/blog/category/sample-posts/index.html +++ b/zh/blog/category/sample-posts/index.html @@ -1 +1 @@ - sample-posts | X - LANCE

                                  sample-posts

                                  该分类下的文章存档

                                  2024年 1月 27日 a post with code diff
                                  2024年 1月 27日 a post with advanced image components
                                  2024年 1月 27日 a post with vega lite
                                  2024年 1月 26日 a post with geojson
                                  2024年 1月 26日 a post with echarts
                                  2024年 1月 26日 a post with chart.js
                                  2023年 12月 12日 a post with TikZJax
                                  2023年 7月 12日 a post with bibliography
                                  2023年 7月 04日 a post with jupyter notebook
                                  2023年 5月 12日 a post with custom blockquotes
                                  2023年 4月 25日 a post with table of contents on a sidebar
                                  2023年 4月 25日 a post with audios
                                  2023年 4月 24日 a post with videos
                                  2023年 3月 20日 displaying beautiful tables with Bootstrap Tables
                                  2023年 3月 20日 a post with table of contents
                                  2022年 12月 10日 a post with giscus comments
                                  2020年 9月 28日 a post with github metadata
                                  2020年 9月 28日 a post with twitter
                                  2015年 10月 20日 a post with disqus comments
                                  2015年 10月 20日 a post with math
                                  2015年 7月 15日 a post with code
                                  2015年 5月 15日 a post with images
                                  2015年 3月 15日 a post with formatting and links
                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + sample-posts | X - LANCE

                                  sample-posts

                                  该分类下的文章存档

                                  2024年 1月 27日 a post with code diff
                                  2024年 1月 27日 a post with advanced image components
                                  2024年 1月 27日 a post with vega lite
                                  2024年 1月 26日 a post with geojson
                                  2024年 1月 26日 a post with echarts
                                  2024年 1月 26日 a post with chart.js
                                  2023年 12月 12日 a post with TikZJax
                                  2023年 7月 12日 a post with bibliography
                                  2023年 7月 04日 a post with jupyter notebook
                                  2023年 5月 12日 a post with custom blockquotes
                                  2023年 4月 25日 a post with table of contents on a sidebar
                                  2023年 4月 25日 a post with audios
                                  2023年 4月 24日 a post with videos
                                  2023年 3月 20日 displaying beautiful tables with Bootstrap Tables
                                  2023年 3月 20日 a post with table of contents
                                  2022年 12月 10日 a post with giscus comments
                                  2020年 9月 28日 a post with github metadata
                                  2020年 9月 28日 a post with twitter
                                  2015年 10月 20日 a post with disqus comments
                                  2015年 10月 20日 a post with math
                                  2015年 7月 15日 a post with code
                                  2015年 5月 15日 a post with images
                                  2015年 3月 15日 a post with formatting and links
                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/index.html b/zh/blog/index.html index a41a62dcdf3c..38e104bf112b 100644 --- a/zh/blog/index.html +++ b/zh/blog/index.html @@ -1 +1 @@ - blog | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + blog | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/page/2/index.html b/zh/blog/page/2/index.html index 34e680c25cfa..546955e40fcb 100644 --- a/zh/blog/page/2/index.html +++ b/zh/blog/page/2/index.html @@ -1 +1 @@ - blog - 页 2 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + blog - 页 2 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/page/3/index.html b/zh/blog/page/3/index.html index 252ae845ea84..31836a11f83c 100644 --- a/zh/blog/page/3/index.html +++ b/zh/blog/page/3/index.html @@ -1 +1 @@ - blog - 页 3 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + blog - 页 3 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/page/4/index.html b/zh/blog/page/4/index.html index 679129a48e06..ed787ffae22f 100644 --- a/zh/blog/page/4/index.html +++ b/zh/blog/page/4/index.html @@ -1 +1 @@ - blog - 页 4 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + blog - 页 4 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/page/5/index.html b/zh/blog/page/5/index.html index c7fbc52a1ef2..26f99badb60e 100644 --- a/zh/blog/page/5/index.html +++ b/zh/blog/page/5/index.html @@ -1 +1 @@ - blog - 页 5 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + blog - 页 5 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/page/6/index.html b/zh/blog/page/6/index.html index 07928defe20f..d95f8f8580b1 100644 --- a/zh/blog/page/6/index.html +++ b/zh/blog/page/6/index.html @@ -1 +1 @@ - blog - 页 6 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + blog - 页 6 | X - LANCE

                                  al-folio in english

                                  a simple whitespace theme for academics



                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/audios/index.html b/zh/blog/tag/audios/index.html index 6149d7d78e22..b8edc21b5bae 100644 --- a/zh/blog/tag/audios/index.html +++ b/zh/blog/tag/audios/index.html @@ -1 +1 @@ - audios | X - LANCE

                                  audios

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + audios | X - LANCE

                                  audios

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/bib/index.html b/zh/blog/tag/bib/index.html index 6cd24a3c3747..747beebb089a 100644 --- a/zh/blog/tag/bib/index.html +++ b/zh/blog/tag/bib/index.html @@ -1 +1 @@ - bib | X - LANCE

                                  bib

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + bib | X - LANCE

                                  bib

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/blockquotes/index.html b/zh/blog/tag/blockquotes/index.html index 4f7538a4c02d..018b4a4c7e7f 100644 --- a/zh/blog/tag/blockquotes/index.html +++ b/zh/blog/tag/blockquotes/index.html @@ -1 +1 @@ - blockquotes | X - LANCE

                                  blockquotes

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + blockquotes | X - LANCE

                                  blockquotes

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/charts/index.html b/zh/blog/tag/charts/index.html index dbe73a1a76b0..2a8b7a63e3af 100644 --- a/zh/blog/tag/charts/index.html +++ b/zh/blog/tag/charts/index.html @@ -1 +1 @@ - charts | X - LANCE

                                  charts

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + charts | X - LANCE

                                  charts

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/code/index.html b/zh/blog/tag/code/index.html index a0e7aeb3d9b0..c07a13c495ed 100644 --- a/zh/blog/tag/code/index.html +++ b/zh/blog/tag/code/index.html @@ -1 +1 @@ - code | X - LANCE

                                  code

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + code | X - LANCE

                                  code

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/comments/index.html b/zh/blog/tag/comments/index.html index 01d8e5235fe7..9f00faee058e 100644 --- a/zh/blog/tag/comments/index.html +++ b/zh/blog/tag/comments/index.html @@ -1 +1 @@ - comments | X - LANCE

                                  comments

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + comments | X - LANCE

                                  comments

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/diagrams/index.html b/zh/blog/tag/diagrams/index.html index d2a19c9e8fe3..c27b4ca98e52 100644 --- a/zh/blog/tag/diagrams/index.html +++ b/zh/blog/tag/diagrams/index.html @@ -1 +1 @@ - diagrams | X - LANCE

                                  diagrams

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + diagrams | X - LANCE

                                  diagrams

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/distill/index.html b/zh/blog/tag/distill/index.html index 41988b8a6d6f..35042ca83bfd 100644 --- a/zh/blog/tag/distill/index.html +++ b/zh/blog/tag/distill/index.html @@ -1 +1 @@ - distill | X - LANCE

                                  distill

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + distill | X - LANCE

                                  distill

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/formatting/index.html b/zh/blog/tag/formatting/index.html index 1bce4465cec7..4846cc449d7a 100644 --- a/zh/blog/tag/formatting/index.html +++ b/zh/blog/tag/formatting/index.html @@ -1 +1 @@ - formatting | X - LANCE

                                  formatting

                                  带有此标签的文章存档

                                  2024年 1月 27日 a post with code diff
                                  2024年 1月 27日 a post with advanced image components
                                  2024年 1月 27日 a post with vega lite
                                  2024年 1月 26日 a post with geojson
                                  2024年 1月 26日 a post with echarts
                                  2024年 1月 26日 a post with chart.js
                                  2023年 12月 12日 a post with TikZJax
                                  2023年 7月 12日 a post with bibliography
                                  2023年 7月 04日 a post with jupyter notebook
                                  2023年 5月 12日 a post with custom blockquotes
                                  2023年 4月 25日 a post with table of contents on a sidebar
                                  2023年 4月 25日 a post with audios
                                  2023年 4月 24日 a post with videos
                                  2023年 3月 20日 displaying beautiful tables with Bootstrap Tables
                                  2023年 3月 20日 a post with table of contents
                                  2021年 7月 04日 a post with diagrams
                                  2020年 9月 28日 a post with twitter
                                  2018年 12月 22日 a distill-style blog post
                                  2015年 10月 20日 a post with math
                                  2015年 7月 15日 a post with code
                                  2015年 5月 15日 a post with images
                                  2015年 3月 15日 a post with formatting and links
                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + formatting | X - LANCE

                                  formatting

                                  带有此标签的文章存档

                                  2024年 1月 27日 a post with code diff
                                  2024年 1月 27日 a post with advanced image components
                                  2024年 1月 27日 a post with vega lite
                                  2024年 1月 26日 a post with geojson
                                  2024年 1月 26日 a post with echarts
                                  2024年 1月 26日 a post with chart.js
                                  2023年 12月 12日 a post with TikZJax
                                  2023年 7月 12日 a post with bibliography
                                  2023年 7月 04日 a post with jupyter notebook
                                  2023年 5月 12日 a post with custom blockquotes
                                  2023年 4月 25日 a post with table of contents on a sidebar
                                  2023年 4月 25日 a post with audios
                                  2023年 4月 24日 a post with videos
                                  2023年 3月 20日 displaying beautiful tables with Bootstrap Tables
                                  2023年 3月 20日 a post with table of contents
                                  2021年 7月 04日 a post with diagrams
                                  2020年 9月 28日 a post with twitter
                                  2018年 12月 22日 a distill-style blog post
                                  2015年 10月 20日 a post with math
                                  2015年 7月 15日 a post with code
                                  2015年 5月 15日 a post with images
                                  2015年 3月 15日 a post with formatting and links
                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/images/index.html b/zh/blog/tag/images/index.html index d056a4c87086..4cf6e3dd8d06 100644 --- a/zh/blog/tag/images/index.html +++ b/zh/blog/tag/images/index.html @@ -1 +1 @@ - images | X - LANCE

                                  images

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + images | X - LANCE

                                  images

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/jupyter/index.html b/zh/blog/tag/jupyter/index.html index f761ef296eb5..358cdffc0f23 100644 --- a/zh/blog/tag/jupyter/index.html +++ b/zh/blog/tag/jupyter/index.html @@ -1 +1 @@ - jupyter | X - LANCE

                                  jupyter

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + jupyter | X - LANCE

                                  jupyter

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/links/index.html b/zh/blog/tag/links/index.html index 2bbebe42d7df..8027927546eb 100644 --- a/zh/blog/tag/links/index.html +++ b/zh/blog/tag/links/index.html @@ -1 +1 @@ - links | X - LANCE

                                  links

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + links | X - LANCE

                                  links

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/maps/index.html b/zh/blog/tag/maps/index.html index 6cf3e078063e..6075a058218f 100644 --- a/zh/blog/tag/maps/index.html +++ b/zh/blog/tag/maps/index.html @@ -1 +1 @@ - maps | X - LANCE

                                  maps

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + maps | X - LANCE

                                  maps

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/math/index.html b/zh/blog/tag/math/index.html index 965858191f83..3a4f2661d386 100644 --- a/zh/blog/tag/math/index.html +++ b/zh/blog/tag/math/index.html @@ -1 +1 @@ - math | X - LANCE

                                  math

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + math | X - LANCE

                                  math

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/metadata/index.html b/zh/blog/tag/metadata/index.html index 12ff426fc418..b85f972cf83d 100644 --- a/zh/blog/tag/metadata/index.html +++ b/zh/blog/tag/metadata/index.html @@ -1 +1 @@ - metadata | X - LANCE

                                  metadata

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + metadata | X - LANCE

                                  metadata

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/sidebar/index.html b/zh/blog/tag/sidebar/index.html index 2277a305734f..75572c99020e 100644 --- a/zh/blog/tag/sidebar/index.html +++ b/zh/blog/tag/sidebar/index.html @@ -1 +1 @@ - sidebar | X - LANCE

                                  sidebar

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + sidebar | X - LANCE

                                  sidebar

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/tables/index.html b/zh/blog/tag/tables/index.html index 0dbf276f655a..9d6acca8385e 100644 --- a/zh/blog/tag/tables/index.html +++ b/zh/blog/tag/tables/index.html @@ -1 +1 @@ - tables | X - LANCE

                                  tables

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + tables | X - LANCE

                                  tables

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/toc/index.html b/zh/blog/tag/toc/index.html index c4f818b6363d..0536c9cae3ff 100644 --- a/zh/blog/tag/toc/index.html +++ b/zh/blog/tag/toc/index.html @@ -1 +1 @@ - toc | X - LANCE

                                  toc

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + toc | X - LANCE

                                  toc

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/blog/tag/videos/index.html b/zh/blog/tag/videos/index.html index 68cab4124a2f..5fc424b89352 100644 --- a/zh/blog/tag/videos/index.html +++ b/zh/blog/tag/videos/index.html @@ -1 +1 @@ - videos | X - LANCE

                                  videos

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + videos | X - LANCE

                                  videos

                                  带有此标签的文章存档

                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/cv/index.html b/zh/cv/index.html index 4c9fd09fbac3..a98928128f06 100644 --- a/zh/cv/index.html +++ b/zh/cv/index.html @@ -1 +1 @@ - cv | X - LANCE

                                  cv

                                  This is a description of the page. You can modify it in '_pages/cv.md'. You can also change or remove the top pdf download button.

                                  Informações Gerais

                                  Nome Completo Albert Einstein
                                  Data de Nascimento 14 de março de 1879
                                  Idiomas Inglês, Alemão

                                  Educação

                                  • 1905
                                    PhD
                                    University of Zurich, Zurique, Suíça
                                    • Descrição 1.
                                    • Descrição 2.
                                    • Descrição 3.
                                      • Sub-descrição 1.
                                      • Sub-descrição 2.
                                  • 1900
                                    Diploma de ensino federal
                                    Eidgenössische Technische Hochschule, Zurique, Suíça
                                    • Descrição 1.
                                    • Descrição 2.

                                  Experiência

                                  • 1933 - 1955
                                    Professor de Física Teórica
                                    Institute for Advanced Study, Princeton University
                                    • Descrição 1.
                                    • Descrição 2.
                                    • Descrição 3.
                                      • Sub-descrição 1.
                                      • Sub-descrição 2.
                                  • 1933
                                    Professor Visitante
                                    California Institute of Technology, Pasadena, Califórnia, EUA
                                    • Descrição 1.
                                    • Descrição 2.
                                  • 1917-1933
                                    Diretor
                                    Kaiser Wilhelm Institute for Physics, Berlim, Alemanha.
                                  • 1911 - 1917
                                    Professor de Física Teórica
                                    Karl-Ferdinand University, Praga, Tchecoslováquia
                                  • 1909 - 1911
                                    Professor Associado de Física Teórica
                                    University of Zurich, Zurique, Suíça

                                  Projetos de Código Aberto

                                  • 2023-atual
                                    multi-language-al-folio
                                    • Uma variação do tema al-folio com suporte a múltiplos idiomas.
                                  • 2015-atual
                                    al-folio
                                    • Um tema Jekyll bonito, simples, limpo e responsivo para acadêmicos.

                                  Honrarias e Prêmios

                                  • 1921
                                    • Prêmio Nobel de Física
                                    • Medalha Matteucci
                                  • 2029
                                    • Medalha Max Planck

                                  Interesses Acadêmicos

                                  • Tópico 1.
                                    • Descrição 1.
                                    • Descrição 2.
                                  • Tópico 2.
                                    • Descrição 1.
                                    • Descrição 2.

                                  Outros Interesses

                                  • Hobbies: Hobby 1, Hobby 2, etc.
                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file + cv | X - LANCE

                                  cv

                                  This is a description of the page. You can modify it in '_pages/cv.md'. You can also change or remove the top pdf download button.

                                  Informações Gerais

                                  Nome Completo Albert Einstein
                                  Data de Nascimento 14 de março de 1879
                                  Idiomas Inglês, Alemão

                                  Educação

                                  • 1905
                                    PhD
                                    University of Zurich, Zurique, Suíça
                                    • Descrição 1.
                                    • Descrição 2.
                                    • Descrição 3.
                                      • Sub-descrição 1.
                                      • Sub-descrição 2.
                                  • 1900
                                    Diploma de ensino federal
                                    Eidgenössische Technische Hochschule, Zurique, Suíça
                                    • Descrição 1.
                                    • Descrição 2.

                                  Experiência

                                  • 1933 - 1955
                                    Professor de Física Teórica
                                    Institute for Advanced Study, Princeton University
                                    • Descrição 1.
                                    • Descrição 2.
                                    • Descrição 3.
                                      • Sub-descrição 1.
                                      • Sub-descrição 2.
                                  • 1933
                                    Professor Visitante
                                    California Institute of Technology, Pasadena, Califórnia, EUA
                                    • Descrição 1.
                                    • Descrição 2.
                                  • 1917-1933
                                    Diretor
                                    Kaiser Wilhelm Institute for Physics, Berlim, Alemanha.
                                  • 1911 - 1917
                                    Professor de Física Teórica
                                    Karl-Ferdinand University, Praga, Tchecoslováquia
                                  • 1909 - 1911
                                    Professor Associado de Física Teórica
                                    University of Zurich, Zurique, Suíça

                                  Projetos de Código Aberto

                                  • 2023-atual
                                    multi-language-al-folio
                                    • Uma variação do tema al-folio com suporte a múltiplos idiomas.
                                  • 2015-atual
                                    al-folio
                                    • Um tema Jekyll bonito, simples, limpo e responsivo para acadêmicos.

                                  Honrarias e Prêmios

                                  • 1921
                                    • Prêmio Nobel de Física
                                    • Medalha Matteucci
                                  • 1929
                                    • Medalha Max Planck

                                  Interesses Acadêmicos

                                  • Tópico 1.
                                    • Descrição 1.
                                    • Descrição 2.
                                  • Tópico 2.
                                    • Descrição 1.
                                    • Descrição 2.

                                  Outros Interesses

                                  • Hobbies: Hobby 1, Hobby 2, etc.
                                  © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                  \ No newline at end of file diff --git a/zh/feed.xml b/zh/feed.xml index 7a24ef2af4d1..2d0e21f98bc9 100644 --- a/zh/feed.xml +++ b/zh/feed.xml @@ -1,4 +1,4 @@ -Jekyll2024-05-26T02:45:34+00:00https://x-lance.github.io/feed.xmlblanka post with code diff2024-01-27T19:22:00+00:002024-01-27T19:22:00+00:00https://x-lance.github.io/blog/2024/code-diffYou can display diff code by using the regular markdown syntax:

                                  ```diff
                                  +Jekyll2024-05-26T02:56:08+00:00https://x-lance.github.io/feed.xmlblanka post with code diff2024-01-27T19:22:00+00:002024-01-27T19:22:00+00:00https://x-lance.github.io/blog/2024/code-diffYou can display diff code by using the regular markdown syntax:

                                  ```diff
                                   diff --git a/sample.js b/sample.js
                                   index 0000001..0ddf2ba
                                   --- a/sample.js
                                  diff --git a/zh/index.html b/zh/index.html
                                  index d4539e072969..9ffebf3bcfd1 100644
                                  --- a/zh/index.html
                                  +++ b/zh/index.html
                                  @@ -1 +1 @@
                                  -        X - LANCE                  

                                  X - LANCE

                                  上海交通大学 跨媒体语言智能实验室

                                  logo_red_clipped.png

                                  电院3号楼223、225
                                  上海交通大学
                                  上海,闵行
                                  xlance@sjtu.edu.cn

                                  欢迎访问上海交通大学 X-LANCE 实验室!

                                  上海交通大学跨媒体语言智能实验室(SJTU Cross Media Language Intelligence Lab, X-LANCE)成立于2012年,前身是“智能语音实验室”(SpeechLab),经过多年发展,成为了涵盖视听文语言信息处理核心各研究领域的“跨模态语言智能实验室”。目前,跨媒体语言智能实验室的教师组有一位教授、四位副教授和一位科研助理,拥有十九名博士研究生,三十六名硕士研究生,还包括ACM班、AI班、IEEE班、电院CS等专业、巴黎卓越工程师学院、密西根学院等的三十余名本科生。

                                  实验室获得了包括国家重点研发计划、自然科学基金委优秀青年科学基金在内的诸多国家和企业项目支持。实验室与思必驰科技股份有限公司深度合作,成立了“上海交通大学思必驰智能人机交互联合实验室”。实验室可调动丰富的数据资源以及多达数百块H800、A800、A10等GPU卡的丰富计算资源,是国际上极少数可以进行产业级大尺度数据分析和研究的人工智能实验室之一。

                                  X-LANCE实验室致力于做能够改变世界的国际水平的技术研究,实验室的学术信条:要用技术改变世界,首先必须是一个优秀的工程师;而一个杰出的工程师一定是一位科学家。

                                  🔥新闻

                                  2024年 5月 18日 🌄【博士生大组会】 2024年度博士生大组会在浙江安吉举行。 【公众号推送】
                                  2024年 5月 02日 📃【论文+3】X-LANCE 实验室的三篇论文被 ACL 2024 主会或Findings接收。 【公众号推送】
                                  2024年 5月 02日 📃【论文+2】X-LANCE 实验室的两篇论文被 ICML 2024 接收。 【公众号推送】

                                  📑论文摘选

                                    © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                    \ No newline at end of file + X - LANCE

                                    X - LANCE

                                    上海交通大学 跨媒体语言智能实验室

                                    logo_red_clipped.png

                                    电院3号楼223、225
                                    上海交通大学
                                    上海,闵行
                                    xlance@sjtu.edu.cn

                                    欢迎访问上海交通大学 X-LANCE 实验室!

                                    上海交通大学跨媒体语言智能实验室(SJTU Cross Media Language Intelligence Lab, X-LANCE)成立于2012年,前身是“智能语音实验室”(SpeechLab),经过多年发展,成为了涵盖视听文语言信息处理核心各研究领域的“跨媒体语言智能实验室”。目前,跨媒体语言智能实验室的教师组有一位教授、四位副教授和一位科研助理,拥有十九名博士研究生,三十六名硕士研究生,还包括ACM班、AI班、IEEE班、电院CS等专业、巴黎卓越工程师学院、密西根学院等的三十余名本科生。

                                    实验室获得了包括国家重点研发计划、自然科学基金委优秀青年科学基金在内的诸多国家和企业项目支持。实验室与思必驰科技股份有限公司深度合作,成立了“上海交通大学思必驰智能人机交互联合实验室”。实验室可调动丰富的数据资源以及多达数百块H800、A800、A10等GPU卡的丰富计算资源,是国际上极少数可以进行产业级大尺度数据分析和研究的人工智能实验室之一。

                                    X-LANCE实验室致力于做能够改变世界的国际水平的技术研究,实验室的学术信条:要用技术改变世界,首先必须是一个优秀的工程师;而一个杰出的工程师一定是一位科学家。

                                    🔥新闻

                                    2024年 5月 18日 🌄【博士生大组会】 2024年度博士生大组会在浙江安吉举行。 【公众号推送】
                                    2024年 5月 02日 📃【论文+3】X-LANCE 实验室的三篇论文被 ACL 2024 主会或Findings接收。 【公众号推送】
                                    2024年 5月 02日 📃【论文+2】X-LANCE 实验室的两篇论文被 ICML 2024 接收。 【公众号推送】

                                    📑论文摘选

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/members/alumni/index.html b/zh/members/alumni/index.html index 7f04bafaa71a..5b263a92c603 100644 --- a/zh/members/alumni/index.html +++ b/zh/members/alumni/index.html @@ -1 +1 @@ - 校友 | X - LANCE

                                      校友

                                      X-LANCE校友


                                      members/faculty/qym_square.jpg

                                      钱彦旻 教授

                                      电院3号楼501
                                      qian-ym@sjtu.edu.cn

                                      钱彦旻,上海交通大学计算机科学与工程系教授,博士生导师。清华大学博士,英国剑桥大学工程系博士后。国家级高层次人才,国家优秀青年基金、吴文俊人工智能自然科学奖一等奖(第一完成人)获得者。现为IEEE高级会员、ISCA会员,同时也是国际开源项目Kaldi语音识别工具包的13位创始成员之一。担任InterSpeech, ISCSLP等国际会议的领域主席和TPC委员;IEEE T-ASLP, IEEE J-STSP, IEEE SPL, ICASSP, InterSpeech等期刊和国际会议审稿人。有10余年从事智能语音及语言处理、人机交互、模式识别及机器学习的研究和产业化工作经验。在本领域的一流国际期刊和会议上发表学术论文200余篇,Google Scholar引用总数12000余次,申请80余项中美专利,合作撰写和翻译多本外文书籍。3次获得领域内国际权威期刊和会议的最优论文奖,5次带队获得国际评测冠军。作为负责人和主要参与者参加了包括国家自然科学基金、国家脑科学计划、国家重点研发计划、国防JKW、国家863、英国EPSRC等多个项目。目前的研究领域包括:语音识别和语音翻译,说话人和语种识别,语音抗噪与分离,音乐生成和理解,语音情感感知,多模态和跨模态信息处理,自然语言理解,深度学习建模,多媒体信号处理等。

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + 校友 | X - LANCE

                                      校友

                                      X-LANCE校友


                                      members/faculty/qym_square.jpg

                                      钱彦旻 教授

                                      电院3号楼501
                                      qian-ym@sjtu.edu.cn

                                      钱彦旻,上海交通大学计算机科学与工程系教授,博士生导师。清华大学博士,英国剑桥大学工程系博士后。国家级高层次人才,国家优秀青年基金、吴文俊人工智能自然科学奖一等奖(第一完成人)获得者。现为IEEE高级会员、ISCA会员,同时也是国际开源项目Kaldi语音识别工具包的13位创始成员之一。担任InterSpeech, ISCSLP等国际会议的领域主席和TPC委员;IEEE T-ASLP, IEEE J-STSP, IEEE SPL, ICASSP, InterSpeech等期刊和国际会议审稿人。有10余年从事智能语音及语言处理、人机交互、模式识别及机器学习的研究和产业化工作经验。在本领域的一流国际期刊和会议上发表学术论文200余篇,Google Scholar引用总数12000余次,申请80余项中美专利,合作撰写和翻译多本外文书籍。3次获得领域内国际权威期刊和会议的最优论文奖,5次带队获得国际评测冠军。作为负责人和主要参与者参加了包括国家自然科学基金、国家脑科学计划、国家重点研发计划、国防JKW、国家863、英国EPSRC等多个项目。目前的研究领域包括:语音识别和语音翻译,说话人和语种识别,语音抗噪与分离,音乐生成和理解,语音情感感知,多模态和跨模态信息处理,自然语言理解,深度学习建模,多媒体信号处理等。

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/members/faculty/index.html b/zh/members/faculty/index.html index f35b782777ec..583c3507864a 100644 --- a/zh/members/faculty/index.html +++ b/zh/members/faculty/index.html @@ -1 +1 @@ - 教师 | X - LANCE

                                      教师


                                      members/faculty/ky_square.jpg

                                      俞凯 特聘教授

                                      电院3号楼539
                                      kai.yu@sjtu.edu.cn
                                      个人主页

                                      俞凯,现任上海交通大学计算机科学与工程系特聘教授、博导,思必驰公司联合创始人、首席科学家。国家“万人计划”科技创新领军人才,曾获国家自然科学基金委青年优青、上海市“东方学者”特聘教授。清华大学自动化系本科、硕士,英国剑桥大学工程系博士。长期从事人工智能领域的智能语音及语言处理、人机交互、模式识别及机器学习的研究和产业化工作。在语音识别及合成、自然语言理解 、口语对话系统、认知型人机交互等方面取得了一系列国际先进的研究、工程和产业化成果。在国际一流会议和期刊发表论文200余篇,获得Computer Speech and Language,Speech Communication 等顶级期刊最优论文奖和InterSpeech等多个顶级国际会议优秀论文奖,在语音识别、对话系统等一系列国际评测中获得冠军。他是国际电子电气工程师协会(IEEE)高级会员,中国大陆高校首个IEEE Speech and Language Processing Technical Committee 委员(2017-2019),IEEE Transactions on Audio Speech and Language Processing 副主编,曾任InterSpeech等国际会议程序委员会主席,ACL、EMNLP等国际会议研究领域主席。


                                      members/faculty/slp_square.jpg

                                      申丽萍 副教授

                                      电院3号楼531
                                      lpshen@sjtu.edu.cn
                                      个人主页

                                      申丽萍,博士,副教授,交大e-Learning实验室负责人。自2001年起为全国信息技术标准化技术委员会教育技术分技术委员会委员,获委员会“20周年卓越贡献奖”。曾任SCI期刊Journal of Ambient Intelligence and Smart Environments编辑。研究领域主要集中在自适应学习技术、情感计算与学习数据分析。主持多项自然科学基金项目和科技支撑项目。近年来在国内外期刊和会议上发表论文三十余篇,其中论文“Affective eLearning: Utilizing Emotion Data to Improve Learning in the Pervasive Environment”获2016年上海CCF普适计算与嵌入式分委员会最佳英文论文奖,该论文谷歌学术中显示被引达500多次。同时已授权专利1个,负责起草已发布国家标准4个,参与起草已发布国际标准2个。是教育通用人工智能大模型系列标准的联合召集人,上海市人工智能技术协会标准人工智能大模型系列标准的主要起草人之一。


                                      members/faculty/cx_square.jpg

                                      陈谐 副教授

                                      SEIEE 3-501
                                      chenxie95@sjtu.edu.cn
                                      个人主页

                                      陈谐,上海交通大学计算机科学与工程系副教授。国家级高层次人才工程获得者。厦门大学本科,清华大学硕士,剑桥大学博士,博士毕业后在剑桥大学从事博士后研究。美国微软语音与语言研究组任高级研究员和资深研究员。主要研究方向是深度学习和智能语音信号处理,如语音识别,语音合成和基于语音的自监督学习。在语音主流会议ICASSP, InterSpeech, ASRU和期刊IEEE/ACM, TASLP发表论文50余篇。


                                      members/faculty/wmy_square.jpg

                                      吴梦玥 副研究员

                                      SEIEE 3-524
                                      mengyuewu@sjtu.edu.cn
                                      个人主页

                                      吴梦玥,上海交通大学计算机科学与工程系副教授,博士生导师,澳大利亚墨尔本大学博士。上海市浦江人才获得者。中国计算机学会语音对话及听觉专业委员会委员。长期从事多媒体信息研究的工作,研究兴趣主要为丰富音频信息感知、自然语言处理、以及多模态融合技术在医疗领域的应用,包括精神卫生、公共卫生以及相关健康声学大数据研究。率先提出音频-文本摘要任务,成为丰富音频领域新的旗舰任务。在ICASSP、Interspeech、Multimedia、IEEE/ACM T-ASLP等智能音频处理及多媒体重要会议和期刊上发表论文50余篇。作为负责人和参与者承担多项国家自然科学基金青年、面上、重大研究计划等项目。


                                      members/faculty/cl_square.jpg

                                      陈露 副研究员

                                      SEIEE 3-223
                                      chenlusz@sjtu.edu.cn
                                      个人主页

                                      陈露,上海交通大学计算机科学与工程系副研究员。主要研究兴趣包括类ChatGPT对话式大语言模型、自然语言处理、AI for Science等。目前已在TPAMI、NeurIPS、ACL等重要国际会议和期刊上发表论文40余篇,研究成果获自然语言处理权威国际会议COLING2018领域主席推荐奖、第十七届全国人机语音通讯学术会议(NCMMSC2022)最佳论文奖、2020年上海交通大学优博奖、2021年中国计算机学会(CCF)优博提名奖、2021年ACM中国(上海分会)优博奖。曾多次带领团队参加国内外智能人机对话与智能问答方向权威挑战赛/技术评测(包括DSTC、Spider、CSpider、CBLUE2.0等)并获得冠军或第一名。其部分研究成果通过产学研合作获得大规模推广应用,转化专利获得第二十三届中国专利奖优秀奖。他还担任国际计算语言学协会滚动审稿机制(ACL ARR)领域主席、自然语言处理顶级期刊TACL常设审稿人(Standing Reviewer),多次担任ICML/NeurIPS/ACL/EMNLP等重要国际学术会议的程序委员会委员。

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + 教师 | X - LANCE

                                      教师


                                      members/faculty/ky_square.jpg

                                      俞凯 特聘教授

                                      电院3号楼539
                                      kai.yu@sjtu.edu.cn
                                      个人主页

                                      俞凯,现任上海交通大学计算机科学与工程系特聘教授、博导,思必驰公司联合创始人、首席科学家。国家“万人计划”科技创新领军人才,曾获国家自然科学基金委青年优青、上海市“东方学者”特聘教授。清华大学自动化系本科、硕士,英国剑桥大学工程系博士。长期从事人工智能领域的智能语音及语言处理、人机交互、模式识别及机器学习的研究和产业化工作。在语音识别及合成、自然语言理解 、口语对话系统、认知型人机交互等方面取得了一系列国际先进的研究、工程和产业化成果。在国际一流会议和期刊发表论文200余篇,获得Computer Speech and Language,Speech Communication 等顶级期刊最优论文奖和InterSpeech等多个顶级国际会议优秀论文奖,在语音识别、对话系统等一系列国际评测中获得冠军。他是国际电子电气工程师协会(IEEE)高级会员,中国大陆高校首个IEEE Speech and Language Processing Technical Committee 委员(2017-2019),IEEE Transactions on Audio Speech and Language Processing 副主编,曾任InterSpeech等国际会议程序委员会主席,ACL、EMNLP等国际会议研究领域主席。


                                      members/faculty/slp_square.jpg

                                      申丽萍 副教授

                                      电院3号楼531
                                      lpshen@sjtu.edu.cn
                                      个人主页

                                      申丽萍,博士,副教授,交大e-Learning实验室负责人。自2001年起为全国信息技术标准化技术委员会教育技术分技术委员会委员,获委员会“20周年卓越贡献奖”。曾任SCI期刊Journal of Ambient Intelligence and Smart Environments编辑。研究领域主要集中在自适应学习技术、情感计算与学习数据分析。主持多项自然科学基金项目和科技支撑项目。近年来在国内外期刊和会议上发表论文三十余篇,其中论文“Affective eLearning: Utilizing Emotion Data to Improve Learning in the Pervasive Environment”获2016年上海CCF普适计算与嵌入式分委员会最佳英文论文奖,该论文谷歌学术中显示被引达500多次。同时已授权专利1个,负责起草已发布国家标准4个,参与起草已发布国际标准2个。是教育通用人工智能大模型系列标准的联合召集人,上海市人工智能技术协会标准人工智能大模型系列标准的主要起草人之一。


                                      members/faculty/cx_square.jpg

                                      陈谐 副教授

                                      SEIEE 3-501
                                      chenxie95@sjtu.edu.cn
                                      个人主页

                                      陈谐,上海交通大学计算机科学与工程系副教授。国家级高层次人才工程获得者。厦门大学本科,清华大学硕士,剑桥大学博士,博士毕业后在剑桥大学从事博士后研究。曾在美国微软语音与语言研究组任高级研究员和资深研究员。主要研究方向是深度学习和智能语音信号处理,如语音识别,语音合成和基于语音的自监督学习。在语音主流会议ICASSP, InterSpeech, ASRU和期刊IEEE/ACM TASLP发表论文50余篇。


                                      members/faculty/wmy_square.jpg

                                      吴梦玥 副研究员

                                      SEIEE 3-524
                                      mengyuewu@sjtu.edu.cn
                                      个人主页

                                      吴梦玥,上海交通大学计算机科学与工程系副教授,博士生导师,澳大利亚墨尔本大学博士。上海市浦江人才获得者。中国计算机学会语音对话及听觉专业委员会委员。长期从事多媒体信息研究的工作,研究兴趣主要为丰富音频信息感知、自然语言处理、以及多模态融合技术在医疗领域的应用,包括精神卫生、公共卫生以及相关健康声学大数据研究。率先提出音频-文本摘要任务,成为丰富音频领域新的旗舰任务。在ICASSP、Interspeech、Multimedia、IEEE/ACM T-ASLP等智能音频处理及多媒体重要会议和期刊上发表论文50余篇。作为负责人和参与者承担多项国家自然科学基金青年、面上、重大研究计划等项目。


                                      members/faculty/cl_square.jpg

                                      陈露 副研究员

                                      SEIEE 3-223
                                      chenlusz@sjtu.edu.cn
                                      个人主页

                                      陈露,上海交通大学计算机科学与工程系副研究员。主要研究兴趣包括类ChatGPT对话式大语言模型、自然语言处理、AI for Science等。目前已在TPAMI、NeurIPS、ACL等重要国际会议和期刊上发表论文40余篇,研究成果获自然语言处理权威国际会议COLING2018领域主席推荐奖、第十七届全国人机语音通讯学术会议(NCMMSC2022)最佳论文奖、2020年上海交通大学优博奖、2021年中国计算机学会(CCF)优博提名奖、2021年ACM中国(上海分会)优博奖。曾多次带领团队参加国内外智能人机对话与智能问答方向权威挑战赛/技术评测(包括DSTC、Spider、CSpider、CBLUE2.0等)并获得冠军或第一名。其部分研究成果通过产学研合作获得大规模推广应用,转化专利获得第二十三届中国专利奖优秀奖。他还担任国际计算语言学协会滚动审稿机制(ACL ARR)领域主席、自然语言处理顶级期刊TACL常设审稿人(Standing Reviewer),多次担任ICML/NeurIPS/ACL/EMNLP等重要国际学术会议的程序委员会委员。

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/members/student/index.html b/zh/members/student/index.html index ba9b31858ca2..22ca08c3dd74 100644 --- a/zh/members/student/index.html +++ b/zh/members/student/index.html @@ -1 +1 @@ - Students | X - LANCE

                                      Students

                                      Students of X-LANCE

                                      博士后

                                      博士研究生

                                      杜晨鹏
                                      078-P
                                      许洪深
                                      091-P
                                      赵梓涵
                                      106-P
                                      张丹阳
                                      112-P
                                      奚彧
                                      107-P
                                      徐薛楠
                                      098-M
                                      刘涛
                                      129-P
                                      曹瑞升
                                      084-M
                                      马子阳
                                      151-P
                                      马达
                                      094-M
                                      张思拓
                                      140-P
                                      王翰坤
                                      150-P
                                      刘浚哲
                                      160-P
                                      朱梓臣
                                      146-UP
                                      杨亦凡
                                      171-P
                                      王鹏宇
                                      145-P
                                      兰焜耀
                                      131-MP
                                      韩杨
                                      166-P
                                      郭奕玮
                                      158-P
                                      罗嘉鸣
                                      147-P
                                      宋秀杰
                                      164-P

                                      硕士研究生

                                      刘韫聪
                                      133-P
                                      黄甘雨
                                      卓建衡
                                      148-M
                                      张晗翀
                                      165-M
                                      谢泽宇
                                      138-U
                                      宋哲书
                                      154-M
                                      孙良泰
                                      170-M
                                      李翰奇
                                      169-M
                                      黎井漂
                                      168-M
                                      何朝帆
                                      172-M
                                      陈禹伸
                                      陈思远
                                      149-M
                                      曾泓川
                                      杨冠柔
                                      153-M
                                      杨飞
                                      徐晓航
                                      139-M
                                      肖云冲
                                      162-M
                                      宋雅昆
                                      彭阅章
                                      罗逸杰
                                      卢葛威
                                      143-M
                                      李俊杰
                                      152-M
                                      李浩宇
                                      159-M
                                      韩森宇
                                      167-M
                                      李星源
                                      172-M
                                      张耀匀

                                      本科生

                                      李柏涵
                                      157-U
                                      张杭磊
                                      王辰润
                                      张熙灼
                                      陈宝才
                                      申振南
                                      陈琦
                                      142-U
                                      张耀中
                                      陈文熙
                                      杨晨
                                      141-U
                                      郑之胜
                                      朱彦桥
                                      郑航
                                      牛志康
                                      罗丹宇
                                      144-U
                                      郑棋曦
                                      李波含
                                      刘轩丞
                                      李之涵
                                      梁宇哲
                                      陈逸恒
                                      夏钲舜
                                      周鼎
                                      李希泉
                                      舒欣茗
                                      姜皓翔
                                      徐瑞阳
                                      张一凡
                                      郭思佳
                                      靳秉睿
                                      万恬溪
                                      王熠笑
                                      文雯
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Students | X - LANCE

                                      Students

                                      Students of X-LANCE

                                      博士研究生

                                      杜晨鹏
                                      078-P
                                      许洪深
                                      091-P
                                      赵梓涵
                                      106-P
                                      张丹阳
                                      112-P
                                      奚彧
                                      107-P
                                      徐薛楠
                                      098-M
                                      刘涛
                                      129-P
                                      曹瑞升
                                      084-M
                                      马子阳
                                      151-P
                                      马达
                                      094-M
                                      张思拓
                                      140-P
                                      王翰坤
                                      150-P
                                      刘浚哲
                                      160-P
                                      朱梓臣
                                      146-UP
                                      杨亦凡
                                      171-P
                                      王鹏宇
                                      145-P
                                      兰焜耀
                                      131-MP
                                      韩杨
                                      166-P
                                      郭奕玮
                                      158-P
                                      罗嘉鸣
                                      147-P
                                      宋秀杰
                                      164-P

                                      硕士研究生

                                      刘韫聪
                                      133-P
                                      黄甘雨
                                      卓建衡
                                      148-M
                                      张晗翀
                                      165-M
                                      谢泽宇
                                      138-U
                                      宋哲书
                                      154-M
                                      孙良泰
                                      170-M
                                      李翰奇
                                      169-M
                                      黎井漂
                                      168-M
                                      何朝帆
                                      172-M
                                      陈禹伸
                                      陈思远
                                      149-M
                                      曾泓川
                                      杨冠柔
                                      153-M
                                      杨飞
                                      徐晓航
                                      139-M
                                      肖云冲
                                      162-M
                                      宋雅昆
                                      彭阅章
                                      罗逸杰
                                      卢葛威
                                      143-M
                                      李俊杰
                                      152-M
                                      李浩宇
                                      159-M
                                      韩森宇
                                      167-M
                                      李星源
                                      172-M
                                      张耀匀

                                      本科生

                                      李柏涵
                                      157-U
                                      张杭磊
                                      王辰润
                                      张熙灼
                                      陈宝才
                                      申振南
                                      陈琦
                                      142-U
                                      张耀中
                                      陈文熙
                                      杨晨
                                      141-U
                                      郑之胜
                                      朱彦桥
                                      郑航
                                      牛志康
                                      罗丹宇
                                      144-U
                                      郑棋曦
                                      李波含
                                      刘轩丞
                                      李之涵
                                      梁宇哲
                                      陈逸恒
                                      夏钲舜
                                      周鼎
                                      李希泉
                                      舒欣茗
                                      姜皓翔
                                      徐瑞阳
                                      张一凡
                                      郭思佳
                                      靳秉睿
                                      万恬溪
                                      王熠笑
                                      文雯
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/announcement_1/index.html b/zh/news/announcement_1/index.html index 435cf182b96e..e81f34cf90aa 100644 --- a/zh/news/announcement_1/index.html +++ b/zh/news/announcement_1/index.html @@ -1 +1 @@ - Announcement_1 | X - LANCE

                                      Announcement_1

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Announcement_1 | X - LANCE

                                      Announcement_1

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/announcement_2/index.html b/zh/news/announcement_2/index.html index a49efa4fa307..1749ff3bf663 100644 --- a/zh/news/announcement_2/index.html +++ b/zh/news/announcement_2/index.html @@ -1 +1 @@ - Announcement_2 | X - LANCE

                                      Announcement_2

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Announcement_2 | X - LANCE

                                      Announcement_2

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/announcement_3/index.html b/zh/news/announcement_3/index.html index 3cbbae4e7a77..33c09c841e8a 100644 --- a/zh/news/announcement_3/index.html +++ b/zh/news/announcement_3/index.html @@ -1 +1 @@ - Announcement_3 | X - LANCE

                                      Announcement_3

                                      📃【论文+3】X-LANCE 实验室的三篇论文被 COLING 2024 和 WSDM 2024 接收。 【公众号推送】

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Announcement_3 | X - LANCE

                                      Announcement_3

                                      📃【论文+3】X-LANCE 实验室的三篇论文被 COLING 2024 和 WSDM 2024 接收。 【公众号推送】

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/announcement_4/index.html b/zh/news/announcement_4/index.html index 2b5d1ae5e711..5391bd72d345 100644 --- a/zh/news/announcement_4/index.html +++ b/zh/news/announcement_4/index.html @@ -1 +1 @@ - Announcement_4 | X - LANCE

                                      Announcement_4

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Announcement_4 | X - LANCE

                                      Announcement_4

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/announcement_5/index.html b/zh/news/announcement_5/index.html index 9a8d2037523c..a78722be80f2 100644 --- a/zh/news/announcement_5/index.html +++ b/zh/news/announcement_5/index.html @@ -1 +1 @@ - Announcement_5 | X - LANCE

                                      Announcement_5

                                      🎆【年度贺词】 共贺新春!上海交通大学跨媒体语音智能实验室2024年夜饭顺利举行。 【公众号推送】

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Announcement_5 | X - LANCE

                                      Announcement_5

                                      🎆【年度贺词】 共贺新春!上海交通大学跨媒体语音智能实验室2024年夜饭顺利举行。 【公众号推送】

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/announcement_6/index.html b/zh/news/announcement_6/index.html index 0b58ab3392df..7bfa171589b2 100644 --- a/zh/news/announcement_6/index.html +++ b/zh/news/announcement_6/index.html @@ -1 +1 @@ - Announcement_6 | X - LANCE

                                      Announcement_6

                                      🤗【大模型+1】上海交通大学、思必驰、苏州实验室联合发布首个化学领域百亿级大模型,化学能力超GPT-4。 【公众号推送】

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Announcement_6 | X - LANCE

                                      Announcement_6

                                      🤗【大模型+1】上海交通大学、思必驰、苏州实验室联合发布首个化学领域百亿级大模型,化学能力超GPT-4。 【公众号推送】

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/announcement_7/index.html b/zh/news/announcement_7/index.html index 9a3d1a48b02f..d06d7dfa4858 100644 --- a/zh/news/announcement_7/index.html +++ b/zh/news/announcement_7/index.html @@ -1 +1 @@ - Announcement_7 | X - LANCE

                                      Announcement_7

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Announcement_7 | X - LANCE

                                      Announcement_7

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/announcement_8/index.html b/zh/news/announcement_8/index.html index 12c5c2acfc2d..4456982c260e 100644 --- a/zh/news/announcement_8/index.html +++ b/zh/news/announcement_8/index.html @@ -1 +1 @@ - Announcement_8 | X - LANCE

                                      Announcement_8

                                      📃【论文+3】X-LANCE 实验室的三篇论文被 ACL 2024 主会或Findings接收。 【公众号推送】

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Announcement_8 | X - LANCE

                                      Announcement_8

                                      📃【论文+3】X-LANCE 实验室的三篇论文被 ACL 2024 主会或Findings接收。 【公众号推送】

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/announcement_9/index.html b/zh/news/announcement_9/index.html index 60193b401870..31aa015784ba 100644 --- a/zh/news/announcement_9/index.html +++ b/zh/news/announcement_9/index.html @@ -1 +1 @@ - Announcement_9 | X - LANCE

                                      Announcement_9

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + Announcement_9 | X - LANCE

                                      Announcement_9

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/news/index.html b/zh/news/index.html index 0081be1f563a..7b5f1e80725a 100644 --- a/zh/news/index.html +++ b/zh/news/index.html @@ -1 +1 @@ - 🔥新闻 | X - LANCE

                                      🔥新闻

                                      2024年 5月 18日 🌄【博士生大组会】 2024年度博士生大组会在浙江安吉举行。 【公众号推送】
                                      2024年 5月 02日 📃【论文+3】X-LANCE 实验室的三篇论文被 ACL 2024 主会或Findings接收。 【公众号推送】
                                      2024年 5月 02日 📃【论文+2】X-LANCE 实验室的两篇论文被 ICML 2024 接收。 【公众号推送】
                                      2024年 4月 07日 🤗【大模型+1】上海交通大学、思必驰、苏州实验室联合发布首个化学领域百亿级大模型,化学能力超GPT-4。 【公众号推送】
                                      2024年 3月 14日 📃【论文+2】X-LANCE 实验室的两篇论文被 NAACL 2024 接收。 【公众号推送】
                                      2024年 2月 29日 📃【论文+3】X-LANCE 实验室的三篇论文被 COLING 2024 和 WSDM 2024 接收。 【公众号推送】
                                      2024年 1月 24日 🎆【年度贺词】 共贺新春!上海交通大学跨媒体语音智能实验室2024年夜饭顺利举行。 【公众号推送】
                                      2023年 12月 31日 📃【论文+3】X-LANCE 实验室的三篇论文被 AAAI 2024 接收。 【公众号推送】
                                      2023年 12月 31日 📃【论文+14】X-LANCE 实验室的十四篇论文被 ICASSP 2024 接收。 【公众号推送1】 【公众号推送2】
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + 🔥新闻 | X - LANCE

                                      🔥新闻

                                      2024年 5月 18日 🌄【博士生大组会】 2024年度博士生大组会在浙江安吉举行。 【公众号推送】
                                      2024年 5月 02日 📃【论文+3】X-LANCE 实验室的三篇论文被 ACL 2024 主会或Findings接收。 【公众号推送】
                                      2024年 5月 02日 📃【论文+2】X-LANCE 实验室的两篇论文被 ICML 2024 接收。 【公众号推送】
                                      2024年 4月 07日 🤗【大模型+1】上海交通大学、思必驰、苏州实验室联合发布首个化学领域百亿级大模型,化学能力超GPT-4。 【公众号推送】
                                      2024年 3月 14日 📃【论文+2】X-LANCE 实验室的两篇论文被 NAACL 2024 接收。 【公众号推送】
                                      2024年 2月 29日 📃【论文+3】X-LANCE 实验室的三篇论文被 COLING 2024 和 WSDM 2024 接收。 【公众号推送】
                                      2024年 1月 24日 🎆【年度贺词】 共贺新春!上海交通大学跨媒体语音智能实验室2024年夜饭顺利举行。 【公众号推送】
                                      2023年 12月 31日 📃【论文+3】X-LANCE 实验室的三篇论文被 AAAI 2024 接收。 【公众号推送】
                                      2023年 12月 31日 📃【论文+14】X-LANCE 实验室的十四篇论文被 ICASSP 2024 接收。 【公众号推送1】 【公众号推送2】
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/papers/index.html b/zh/papers/index.html index 7e452345c0a1..a881b810b113 100644 --- a/zh/papers/index.html +++ b/zh/papers/index.html @@ -1 +1 @@ - 📃论文 | X - LANCE

                                      📃论文

                                      论文按时间倒序列出。

                                      2024

                                      1. Advanced Long-Content Speech Recognition With Factorized Neural Transducer
                                        Xun Gong , Yu Wu , Jinyu Li , Shujie Liu , Rui Zhao , Xie Chen, and Yanmin Qian
                                        IEEE ACM Trans. Audio Speech Lang. Process., 2024
                                      2. EAT: Self-Supervised Pre-Training with Efficient Audio Transformer
                                        Wenxi Chen , Yuzhe Liang , Ziyang Ma , Zhisheng Zheng , and Xie Chen
                                        CoRR, 2024
                                      3. ELLA-V: Stable Neural Codec Language Modeling with Alignment-guided Sequence Reordering
                                        Yakun Song , Zhuo Chen , Xiaofei Wang , Ziyang Ma , and Xie Chen
                                        CoRR, 2024
                                      4. BAT: Learning to Reason about Spatial Sounds with Large Language Models
                                        Zhisheng Zheng , Puyuan Peng , Ziyang Ma , Xie Chen, Eunsol Choi , and David Harwath
                                        CoRR, 2024
                                      5. An Embarrassingly Simple Approach for LLM with Strong ASR Capacity
                                        Ziyang Ma , Guanrou Yang , Yifan Yang , Zhifu Gao , Jiaming Wang , Zhihao Du , Fan Yu , Qian Chen , Siqi Zheng , Shiliang Zhang , and Xie Chen
                                        CoRR, 2024
                                      6. Beyond the Status Quo: A Contemporary Survey of Advances and Challenges in Audio Captioning
                                        Xuenan Xu , Zeyu Xie , Mengyue Wu, and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., 2024
                                      7. Towards Weakly Supervised Text-to-Audio Grounding
                                        Xuenan Xu , Ziyang Ma , Mengyue Wu, and Kai Yu
                                        CoRR, 2024
                                      8. VALL-T: Decoder-Only Generative Transducer for Robust and Decoding-Controllable Text-to-Speech
                                        Chenpeng Du , Yiwei Guo , Hankun Wang , Yifan Yang , Zhikang Niu , Shuai Wang , Hui Zhang , Xie Chen, and Kai Yu
                                        CoRR, 2024
                                      9. ChemDFM: Dialogue Foundation Model for Chemistry
                                        Zihan Zhao , Da Ma , Lu Chen, Liangtai Sun , Zihao Li , Hongshen Xu , Zichen Zhu , Su Zhu , Shuai Fan , Guodong Shen , Xin Chen , and Kai Yu
                                        CoRR, 2024
                                      10. MULTI: Multimodal Understanding Leaderboard with Text and Images
                                        Zichen Zhu, Yang Xu , Lu Chen, Jingkai Yang , Yichuan Ma , Yiming Sun , Hailin Wen , Jiaqi Liu , Jinyu Cai , Yingzi Ma , Situo Zhang , Zihan Zhao , Liangtai Sun , and Kai Yu
                                        CoRR, 2024

                                      2023

                                      1. A Unified Framework From Face Image Restoration to Data Augmentation Using Generative Prior
                                        Jiawei You , Ganyu Huang , Tianyuan Han , Haoze Yang , and Liping Shen
                                        IEEE Access, 2023
                                      2. Human Pose Estimation with Combined Feature Maps and Joint Embeddings
                                        Tianyuan Han , Ganyu Huang , Chunhui Li , and Liping Shen
                                        In Proceedings of the 2023 International Conference on Advances in Artificial Intelligence and Applications, AAIA 2023, Wuhan, China, November 18-20, 2023 , 2023
                                      3. Assessing and Enhancing LLMs: A Physics and History Dataset and One-More-Check Pipeline Method
                                        Chaofan He , Chunhui Li , Tianyuan Han , and Liping Shen
                                        In Neural Information Processing - 30th International Conference, ICONIP 2023, Changsha, China, November 20-23, 2023, Proceedings, Part XIII , 2023
                                      4. GAN Latent Space Manipulation Based Augmentation for Unbalanced Emotion Datasets
                                        Yuhan Xiong , Jiawei You , and Liping Shen
                                        In International Joint Conference on Neural Networks, IJCNN 2023, Gold Coast, Australia, June 18-23, 2023 , 2023
                                      5. LongFNT: Long-Form Speech Recognition with Factorized Neural Transducer
                                        Xun Gong , Yu Wu , Jinyu Li , Shujie Liu , Rui Zhao , Xie Chen, and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      6. Factorized AED: Factorized Attention-Based Encoder-Decoder for Text-Only Domain Adaptive ASR
                                        Xun Gong , Wei Wang , Hang Shao , Xie Chen, and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      7. Exploring Binary Classification Loss for Speaker Verification
                                        Bing Han , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      8. Improving Dino-Based Self-Supervised Speaker Verification with Progressive Cluster-Aware Training
                                        Bing Han , Wen Huang , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      9. Robust Audio-Visual ASR with Unified Cross-Modal Attention
                                        Jiahong Li , Chenda Li , Yifei Wu , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      10. Target Sound Extraction with Variable Cross-Modality Clues
                                        Chenda Li , Yao Qian , Zhuo Chen , Dongmei Wang , Takuya Yoshioka , Shujie Liu , Yanmin Qian , and Michael Zeng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      11. Predictive Skim: Contrastive Predictive Coding for Low-Latency Online Speech Separation
                                        Chenda Li , Yifei Wu , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      12. Multi-Speaker End-to-End Multi-Modal Speaker Diarization System for the MISP 2022 Challenge
                                        Tao Liu , Zhengyang Chen , Yanmin Qian , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      13. Joint Discriminator and Transfer Based Fast Domain Adaptation For End-To-End Speech Recognition
                                        Hang Shao , Tian Tan , Wei Wang , Xun Gong , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      14. Lowbit Neural Network Quantization for Speaker Verification
                                        Haoyu Wang , Bei Liu , Yifei Wu , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      15. Wespeaker: A Research and Production Oriented Speaker Embedding Learning Toolkit
                                        Hongji Wang , Chengdong Liang , Shuai Wang , Zhengyang Chen , Binbin Zhang , Xu Xiang , Yanlei Deng , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      16. HuBERT-AGG: Aggregated Representation Distillation of Hidden-Unit Bert for Robust Speech Recognition
                                        Wei Wang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      17. Light-Weight Visualvoice: Neural Network Quantization On Audio Visual Speech Separation
                                        Yifei Wu , Chenda Li , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      18. Code-Switching Text Generation and Injection in Mandarin-English ASR
                                        Haibin Yu , Yuxuan Hu , Yao Qian , Ma Jin , Linquan Liu , Shujie Liu , Yu Shi , Yanmin Qian , Edward Lin , and Michael Zeng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      19. Adaptive Large Margin Fine-Tuning For Robust Speaker Verification
                                        Leying Zhang , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      20. ComSL: A Composite Speech-Language Model for End-to-End Speech-to-Text Translation
                                        Chenyang Le , Yao Qian , Long Zhou , Shujie Liu , Yanmin Qian , Michael Zeng , and Xuedong Huang
                                        In Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023 , 2023
                                      21. Exploring the Integration of Speech Separation and Recognition with Self-Supervised Learning Representation
                                        Yoshiki Masuyama , Xuankai Chang , Wangyou Zhang , Samuele Cornell , Zhong-Qiu Wang , Nobutaka Ono , Yanmin Qian , and Shinji Watanabe
                                        In IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2023, New Paltz, NY, USA, October 22-25, 2023 , 2023
                                      22. Software Design and User Interface of ESPnet-SE++: Speech Enhancement for Robust Speech Processing (espnet-v.202310) (Version 1)
                                        Yen-Ju Lu , Xuankai Chang , Chenda Li , Wangyou Zhang , Samuele Cornell , Zhaoheng Ni , Yoshiki Masuyama , Brian Yan , Robin Scheibler , Zhong-Qiu Wang , Yu Tsao , Yanmin Qian , and Shinji Watanabe
                                        Oct 2023
                                        Accessed on YYYY-MM-DD.
                                      23. Self-Supervised Learning with Cluster-Aware-DINO for High-Performance Robust Speaker Verification
                                        Bing Han , Zhengyang Chen , and Yanmin Qian
                                        CoRR, Oct 2023
                                      24. Attention-based Encoder-Decoder Network for End-to-End Neural Speaker Diarization with Target Speaker Attractor
                                        Zhengyang Chen , Bing Han , Shuai Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      25. Whisper-KDQ: A Lightweight Whisper via Guided Knowledge Distillation and Quantization for Efficient ASR
                                        Hang Shao , Wei Wang , Bei Liu , Xun Gong , Haoyu Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      26. Weakly-Supervised Speech Pre-training: A Case Study on Target Speech Recognition
                                        Wangyou Zhang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      27. Adapting Multi-Lingual ASR Models for Handling Multiple Talkers
                                        Chenda Li , Yao Qian , Zhuo Chen , Naoyuki Kanda , Dongmei Wang , Takuya Yoshioka , Yanmin Qian , and Michael Zeng
                                        CoRR, Oct 2023
                                      28. InstructME: An Instruction Guided Music Edit And Remix Framework with Latent Diffusion Models
                                        Bing Han , Junyu Dai , Xuchen Song , Weituo Hao , Xinyan He , Dong Guo , Jitong Chen , Yuxuan Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      29. Attention-based Encoder-Decoder End-to-End Neural Diarization with Embedding Enhancer
                                        Zhengyang Chen , Bing Han , Shuai Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      30. USED: Universal Speaker Extraction and Diarization
                                        Junyi Ao , Mehmet Sinan Yildirim , Meng Ge , Shuai Wang , Ruijie Tao , Yanmin Qian , Liqun Deng , Longshuai Xiao , and Haizhou Li
                                        CoRR, Oct 2023
                                      31. Leveraging In-the-Wild Data for Effective Self-Supervised Pretraining in Speaker Recognition
                                        Shuai Wang , Qibing Bai , Qi Liu , Jianwei Yu , Zhengyang Chen , Bing Han , Yanmin Qian , and Haizhou Li
                                        CoRR, Oct 2023
                                      32. The second multi-channel multi-party meeting transcription challenge (M2MeT 2.0): A benchmark for speaker-attributed ASR
                                        Yuhao Liang , Mohan Shi , Fan Yu , Yangze Li , Shiliang Zhang , Zhihao Du , Qian Chen , Lei Xie , Yanmin Qian , Jian Wu , Zhuo Chen , Kong Aik Lee , Zhijie Yan , and Hui Bu
                                        CoRR, Oct 2023
                                      33. Diffusion Conditional Expectation Model for Efficient and Robust Target Speech Extraction
                                        Leying Zhang , Yao Qian , Linfeng Yu , Heming Wang , Xinkai Wang , Hemin Yang , Long Zhou , Shujie Liu , Yanmin Qian , and Michael Zeng
                                        CoRR, Oct 2023
                                      34. Toward Universal Speech Enhancement for Diverse Input Conditions
                                        Wangyou Zhang , Kohei Saijo , Zhong-Qiu Wang , Shinji Watanabe , and Yanmin Qian
                                        CoRR, Oct 2023
                                      35. One-Shot Sensitivity-Aware Mixed Sparsity Pruning for Large Language Models
                                        Hang Shao , Bei Liu , and Yanmin Qian
                                        CoRR, Oct 2023
                                      36. FAT-HuBERT: Front-end Adaptive Training of Hidden-unit BERT for Distortion-Invariant Robust Speech Recognition
                                        Dongning Yang , Wei Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      37. Speaker Adaptive Text-to-Speech With Timbre-Normalized Vector-Quantized Feature
                                        Chenpeng Du , Yiwei Guo , Xie Chen, and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2023
                                      38. Fast-Hubert: an Efficient Training Framework for Self-Supervised Speech Representation Learning
                                        Guanrou Yang , Ziyang Ma , Zhisheng Zheng , Yakun Song , Zhikang Niu , and Xie Chen
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2023, Taipei, Taiwan, December 16-20, 2023 , Oct 2023
                                      39. Improving Few-Shot Learning for Talking Face System with TTS Data Augmentation
                                        Qi Chen , Ziyang Ma , Tao Liu , Xu Tan , Qu Lu , Kai Yu , and Xie Chen
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      40. Front-End Adapter: Adapting Front-End Input of Speech Based Self-Supervised Learning for Speech Recognition
                                        Xie Chen, Ziyang Ma , Changli Tang , Yujin Wang , and Zhisheng Zheng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      41. Emodiff: Intensity Controllable Emotional Text-to-Speech with Soft-Label Guidance
                                        Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      42. DAE-Talker: High Fidelity Speech-Driven Talking Face Generation with Diffusion Autoencoder
                                        Chenpeng Du , Qi Chen , Tianyu He , Xu Tan , Xie Chen, Kai Yu, Sheng Zhao , and Jiang Bian
                                        In Proceedings of the 31st ACM International Conference on Multimedia, MM 2023, Ottawa, ON, Canada, 29 October 2023- 3 November 2023 , Oct 2023
                                      43. Blank-regularized CTC for Frame Skipping in Neural Transducer
                                        Yifan Yang , Xiaoyu Yang , Liyong Guo , Zengwei Yao , Wei Kang , Fangjun Kuang , Long Lin , Xie Chen, and Daniel Povey
                                        CoRR, Oct 2023
                                      44. UniCATS: A Unified Context-Aware Text-to-Speech Framework with Contextual VQ-Diffusion and Vocoding
                                        Chenpeng Du , Yiwei Guo , Feiyu Shen , Zhijun Liu , Zheng Liang , Xie Chen, Shuai Wang , Hui Zhang , and Kai Yu
                                        CoRR, Oct 2023
                                      45. Improving Code-Switching and Named Entity Recognition in ASR with Speech Editing based Data Augmentation
                                        Zheng Liang , Zheshu Song , Ziyang Ma , Chenpeng Du , Kai Yu , and Xie Chen
                                        CoRR, Oct 2023
                                      46. Pushing the Limits of Unsupervised Unit Discovery for SSL Speech Representation
                                        Ziyang Ma , Zhisheng Zheng , Guanrou Yang , Yu Wang , Chao Zhang , and Xie Chen
                                        CoRR, Oct 2023
                                      47. Towards Effective and Compact Contextual Representation for Conformer Transducer Speech Recognition Systems
                                        Mingyu Cui , Jiawen Kang , Jiajun Deng , Xi Yin , Yutao Xie , Xie Chen, and Xunying Liu
                                        CoRR, Oct 2023
                                      48. DSE-TTS: Dual Speaker Embedding for Cross-Lingual Text-to-Speech
                                        Sen Liu , Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      49. Unsupervised Active Learning: Optimizing Labeling Cost-Effectiveness for Automatic Speech Recognition
                                        Zhisheng Zheng , Ziyang Ma , Yu Wang , and Xie Chen
                                        CoRR, Oct 2023
                                      50. VoiceFlow: Efficient Text-to-Speech with Rectified Flow Matching
                                        Yiwei Guo , Chenpeng Du , Ziyang Ma , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      51. Towards Universal Speech Discrete Tokens: A Case Study for ASR and TTS
                                        Yifan Yang , Feiyu Shen , Chenpeng Du , Ziyang Ma , Kai Yu, Daniel Povey , and Xie Chen
                                        CoRR, Oct 2023
                                      52. Incorporating Class-based Language Model for Named Entity Recognition in Factorized Neural Transducer
                                        Peng Wang , Yifan Yang , Zheng Liang , Tian Tan , Shiliang Zhang , and Xie Chen
                                        CoRR, Oct 2023
                                      53. Improved Factorized Neural Transducer Model For text-only Domain Adaptation
                                        Junzhe Liu , Jianwei Yu , and Xie Chen
                                        CoRR, Oct 2023
                                      54. Leveraging Speech PTM, Text LLM, and Emotional TTS for Speech Emotion Recognition
                                        Ziyang Ma , Wen Wu , Zhisheng Zheng , Yiwei Guo , Qian Chen , Shiliang Zhang , and Xie Chen
                                        CoRR, Oct 2023
                                      55. Acoustic BPE for Speech Generation with Discrete Tokens
                                        Feiyu Shen , Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      56. Expressive TTS Driven by Natural Language Prompts Using Few Human Annotations
                                        Hanglei Zhang , Yiwei Guo , Sen Liu , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      57. emotion2vec: Self-Supervised Pre-Training for Speech Emotion Representation
                                        Ziyang Ma , Zhisheng Zheng , Jiaxin Ye , Jinchao Li , Zhifu Gao , Shiliang Zhang , and Xie Chen
                                        CoRR, Oct 2023
                                      58. OPAL: Ontology-Aware Pretrained Language Model for End-to-End Task-Oriented Dialogue
                                        Zhi Chen , Yuncong Liu , Lu Chen , Su Zhu , Mengyue Wu, and Kai Yu
                                        Trans. Assoc. Comput. Linguistics, Oct 2023
                                      59. Transcribing Vocal Communications of Domestic Shiba Inu Dogs
                                        Jieyi Huang , Chunhao Zhang , Mengyue Wu , and Kenny Q. Zhu
                                        In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      60. Detection of Multiple Mental Disorders from Social Media with Two-Stream Psychiatric Experts
                                        Siyuan Chen , Zhiling Zhang , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
                                      61. Semantic Space Grounded Weighted Decoding for Multi-Attribute Controllable Dialogue Generation
                                        Zhiling Zhang , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
                                      62. Diverse and Vivid Sound Generation from Text Descriptions
                                        Guangwei Li , Xuenan Xu , Lingfeng Dai , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      63. Investigating Pooling Strategies and Loss Functions for Weakly-Supervised Text-to-Audio Grounding via Contrastive Learning
                                        Xuenan Xu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      64. BLAT: Bootstrapping Language-Audio Pre-training based on AudioSet Tag-guided Synthetic Data
                                        Xuenan Xu , Zhiling Zhang , Zelin Zhou , Pingyue Zhang , Zeyu Xie , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the 31st ACM International Conference on Multimedia, MM 2023, Ottawa, ON, Canada, 29 October 2023 - 3 November 2023 , Oct 2023
                                      65. LLM-empowered Chatbots for Psychiatrist and Patient Simulation: Application and Evaluation
                                        Siyuan Chen , Mengyue Wu , Kenny Q. Zhu , Kunyao Lan , Zhiling Zhang , and Lyuchun Cui
                                        CoRR, Oct 2023
                                      66. Enhance Temporal Relations in Audio Captioning with Sound Event Detection
                                        Zeyu Xie , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2023
                                      67. Improving Audio Caption Fluency with Automatic Error Correction
                                        Hanxue Zhang , Zeyu Xie , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2023
                                      68. A Large-scale Dataset for Audio-Language Representation Learning
                                        Luoyi Sun , Xuenan Xu , Mengyue Wu, and Weidi Xie
                                        CoRR, Oct 2023
                                      69. Does My Dog "Speak" Like Me? The Acoustic Correlation between Pet Dogs and Their Human Owners
                                        Jieyi Huang , Chunhao Zhang , Yufei Wang , Mengyue Wu , and Kenny Q. Zhu
                                        CoRR, Oct 2023
                                      70. Towards Lexical Analysis of Dog Vocalizations via Online Videos
                                        Yufei Wang , Chunhao Zhang , Jieyi Huang , Mengyue Wu , and Kenny Q. Zhu
                                        CoRR, Oct 2023
                                      71. PsyEval: A Comprehensive Large Language Model Evaluation Benchmark for Mental Health
                                        Haoan Jin , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
                                        CoRR, Oct 2023
                                      72. A Heterogeneous Graph to Abstract Syntax Tree Framework for Text-to-SQL
                                        Ruisheng Cao , Lu Chen, Jieyu Li , Hanchong Zhang , Hongshen Xu , Wangyou Zhang , and Kai Yu
                                        IEEE Trans. Pattern Anal. Mach. Intell., Oct 2023
                                      73. Speech Enhancement With Integration of Neural Homomorphic Synthesis and Spectral Masking
                                        Wenbin Jiang , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2023
                                      74. SPM: A Split-Parsing Method for Joint Multi-Intent Detection and Slot Filling
                                        Sheng Jiang , Su Zhu , Ruisheng Cao , Qingliang Miao , and Kai Yu
                                        In Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics: Industry Track, ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      75. Exploring Schema Generalizability of Text-to-SQL
                                        Jieyu Li , Lu Chen, Ruisheng Cao , Su Zhu , Hongshen Xu , Zhi Chen , Hanchong Zhang , and Kai Yu
                                        In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      76. TeCS: A Dataset and Benchmark for Tense Consistency of Machine Translation
                                        Yiming Ai , Zhiwei He , Kai Yu, and Rui Wang
                                        In Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      77. CSS: A Large-scale Cross-schema Chinese Text-to-SQL Medical Dataset
                                        Hanchong Zhang , Jieyu Li , Lu Chen, Ruisheng Cao , Yunyan Zhang , Yu Huang , Yefeng Zheng , and Kai Yu
                                        In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      78. ACT-SQL: In-Context Learning for Text-to-SQL with Automatically-Generated Chain-of-Thought
                                        Hanchong Zhang , Ruisheng Cao , Lu Chen, Hongshen Xu , and Kai Yu
                                        In Findings of the Association for Computational Linguistics: EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
                                      79. Multi-Speaker Multi-Lingual VQTTS System for LIMMITS 2023 Challenge
                                        Chenpeng Du , Yiwei Guo , Feiyu Shen , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      80. DiffVoice: Text-to-Speech with Latent Diffusion
                                        Zhijun Liu , Yiwei Guo , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      81. Large Language Models Are Semi-Parametric Reinforcement Learning Agents
                                        Danyang Zhang , Lu Chen, Situo Zhang , Hongshen Xu , Zihan Zhao , and Kai Yu
                                        In Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023 , Oct 2023
                                      82. Mobile-Env: A Universal Platform for Training and Evaluation of Mobile Interaction
                                        Danyang Zhang , Lu Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      83. SciEval: A Multi-Level Large Language Model Evaluation Benchmark for Scientific Research
                                        Liangtai Sun , Yang Han , Zihan Zhao , Da Ma , Zhennan Shen , Baocai Chen , Lu Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      84. ASTormer: An AST Structure-aware Transformer Decoder for Text-to-SQL
                                        Ruisheng Cao , Hanchong Zhang , Hongshen Xu , Jieyu Li , Da Ma , Lu Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      85. DiffDub: Person-generic Visual Dubbing Using Inpainting Renderer with Diffusion Auto-encoder
                                        Tao Liu , Chenpeng Du , Shuai Fan , Feilong Chen , and Kai Yu
                                        CoRR, Oct 2023
                                      86. SEF-VC: Speaker Embedding Free Zero-Shot Voice Conversion with Cross Attention
                                        Junjie Li , Yiwei Guo , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023

                                      2022

                                      1. Heterogeneous Graph Representation for Knowledge Tracing
                                        Jisen Chen , Jian Shen , Ting Long , Liping Shen, Weinan Zhang , and Yong Yu
                                        In Neural Information Processing - 29th International Conference, ICONIP 2022, Virtual Event, November 22-26, 2022, Proceedings, Part I , Oct 2022
                                      2. A simple but practical method: How to improve the usage of entities in the Chinese question generation
                                        Haoze Yang , Kunyao Lan , Jiawei You , and Liping Shen
                                        In International Joint Conference on Neural Networks, IJCNN 2022, Padua, Italy, July 18-23, 2022 , Oct 2022
                                      3. From Uniform Models To Generic Representations: Stock Return Prediction With Pre-training
                                        Jiawei You , Tianyuan Han , and Liping Shen
                                        In International Joint Conference on Neural Networks, IJCNN 2022, Padua, Italy, July 18-23, 2022 , Oct 2022
                                      4. WavLM: Large-Scale Self-Supervised Pre-Training for Full Stack Speech Processing
                                        Sanyuan Chen , Chengyi Wang , Zhengyang Chen , Yu Wu , Shujie Liu , Zhuo Chen , Jinyu Li , Naoyuki Kanda , Takuya Yoshioka , Xiong Xiao , Jian Wu , Long Zhou , Shuo Ren , Yanmin Qian , Yao Qian , Jian Wu , Michael Zeng , Xiangzhan Yu , and Furu Wei
                                        IEEE J. Sel. Top. Signal Process., Oct 2022
                                      5. Optimizing Data Usage for Low-Resource Speech Recognition
                                        Yanmin Qian , and Zhikai Zhou
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      6. Dual-Path Modeling With Memory Embedding Model for Continuous Speech Separation
                                        Chenda Li , Zhuo Chen , and Yanmin Qian
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      7. Layer-Wise Fast Adaptation for End-to-End Multi-Accent Speech Recognition
                                        Yanmin Qian , Xun Gong , and Houjun Huang
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      8. End-to-End Dereverberation, Beamforming, and Speech Recognition in a Cocktail Party
                                        Wangyou Zhang , Xuankai Chang , Christoph Böddeker , Tomohiro Nakatani , Shinji Watanabe , and Yanmin Qian
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      9. Time-Domain Audio-Visual Speech Separation on Low Quality Videos
                                        Yifei Wu , Chenda Li , Jinfeng Bai , Zhongqin Wu , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      10. SkiM: Skipping Memory LSTM for Low-Latency Real-Time Continuous Speech Separation
                                        Chenda Li , Lei Yang , Weiqin Wang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      11. Large-Scale Self-Supervised Speech Representation Learning for Automatic Speaker Verification
                                        Zhengyang Chen , Sanyuan Chen , Yu Wu , Yao Qian , Chengyi Wang , Shujie Liu , Yanmin Qian , and Michael Zeng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      12. Local Information Modeling with Self-Attention for Speaker Verification
                                        Bing Han , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      13. Punctuation Prediction for Streaming On-Device Speech Recognition
                                        Zhikai Zhou , Tian Tan , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      14. MLP-SVNET: A Multi-Layer Perceptrons Based Network for Speaker Verification
                                        Bing Han , Zhengyang Chen , Bei Liu , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      15. Self-Knowledge Distillation via Feature Enhancement for Speaker Verification
                                        Bei Liu , Haoyu Wang , Zhengyang Chen , Shuai Wang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      16. Optimizing Alignment of Speech and Language Latent Spaces for End-To-End Speech Recognition and Understanding
                                        Wei Wang , Shuo Ren , Yao Qian , Shujie Liu , Yu Shi , Yanmin Qian , and Michael Zeng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      17. Exploring Effective Data Utilization for Low-Resource Speech Recognition
                                        Zhikai Zhou , Wei Wang , Wangyou Zhang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      18. Summary on the ICASSP 2022 Multi-Channel Multi-Party Meeting Transcription Grand Challenge
                                        Fan Yu , Shiliang Zhang , Pengcheng Guo , Yihui Fu , Zhihao Du , Siqi Zheng , Weilong Huang , Lei Xie , Zheng-Hua Tan , DeLiang Wang , Yanmin Qian , Kong Aik Lee , Zhijie Yan , Bin Ma , Xin Xu , and Hui Bu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      19. The SJTU System for Multimodal Information Based Speech Processing Challenge 2021
                                        Wei Wang , Xun Gong , Yifei Wu , Zhikai Zhou , Chenda Li , Wangyou Zhang , Bing Han , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      20. Attentive Feature Fusion for Robust Speaker Verification
                                        Bei Liu , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      21. Dual Path Embedding Learning for Speaker Verification with Triplet Attention
                                        Bei Liu , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      22. DF-ResNet: Boosting Speaker Verification Performance with Depth-First Design
                                        Bei Liu , Zhengyang Chen , Shuai Wang , Haoyu Wang , Bing Han , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      23. Enroll-Aware Attentive Statistics Pooling for Target Speaker Verification
                                        Leying Zhang , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      24. MSDWild: Multi-modal Speaker Diarization Dataset in the Wild
                                        Tao Liu , Shuai Fan , Xu Xiang , Hongbo Song , Shaoxiong Lin , Jiaqi Sun , Tianyuan Han , Siyuan Chen , Binwei Yao , Sen Liu , Yifei Wu , Yanmin Qian , and Kai Yu
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      25. Knowledge Transfer and Distillation from Autoregressive to Non-Autoregressive Speech Recognition
                                        Xun Gong , Zhikai Zhou , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      26. Self-Supervised Speaker Verification Using Dynamic Loss-Gate and Label Correction
                                        Bing Han , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      27. Separating Long-Form Speech with Group-wise Permutation Invariant Training
                                        Wangyou Zhang , Zhuo Chen , Naoyuki Kanda , Shujie Liu , Jinyu Li , Sefik Emre Eskimez , Takuya Yoshioka , Xiong Xiao , Zhong Meng , Yanmin Qian , and Furu Wei
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      28. ESPnet-SE++: Speech Enhancement for Robust Speech Recognition, Translation, and Understanding
                                        Yen-Ju Lu , Xuankai Chang , Chenda Li , Wangyou Zhang , Samuele Cornell , Zhaoheng Ni , Yoshiki Masuyama , Brian Yan , Robin Scheibler , Zhong-Qiu Wang , Yu Tsao , Yanmin Qian , and Shinji Watanabe
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      29. Improving Speech Separation with Knowledge Distilled from Self-supervised Pre-trained Models
                                        Bowen Qu , Chenda Li , Jinfeng Bai , and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      30. Text-Informed Knowledge Distillation for Robust Speech Enhancement and Recognition
                                        Wei Wang , Wangyou Zhang , Shaoxiong Lin , and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      31. Medical Difficult Airway Detection using Speech Technology
                                        Zhikai Zhou , Shuang Cao , Zhengyang Chen , Bei Liu , Ming Xia , Hong Jiang , and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      32. Speaking style compensation on synthetic audio for robust keyword spotting
                                        Houjun Huang , and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      33. The Conversational Short-phrase Speaker Diarization (CSSD) Task: Dataset, Evaluation Metric and Baselines
                                        Gaofeng Cheng , Yifan Chen , Runyan Yang , Qingxuan Li , Zehui Yang , Lingxuan Ye , Pengyuan Zhang , Qingqing Zhang , Lei Xie , Yanmin Qian , Kong Aik Lee , and Yonghong Yan
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      34. The X-Lance Speaker Diarization System for the Conversational Short-phrase Speaker Diarization Challenge 2022
                                        Tao Liu , Xu Xiang , Zhengyang Chen , Bing Han , Kai Yu, and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      35. End-to-End Multi-Speaker ASR with Independent Vector Analysis
                                        Robin Scheibler , Wangyou Zhang , Xuankai Chang , Shinji Watanabe , and Yanmin Qian
                                        In IEEE Spoken Language Technology Workshop, SLT 2022, Doha, Qatar, January 9-12, 2023 , Oct 2022
                                      36. A Comprehensive Study on Self-Supervised Distillation for Speaker Representation Learning
                                        Zhengyang Chen , Yao Qian , Bing Han , Yanmin Qian , and Michael Zeng
                                        In IEEE Spoken Language Technology Workshop, SLT 2022, Doha, Qatar, January 9-12, 2023 , Oct 2022
                                      37. The SJTU X-LANCE Lab System for CNSRC 2022
                                        Zhengyang Chen , Bei Liu , Bing Han , Leying Zhang , and Yanmin Qian
                                        CoRR, Oct 2022
                                      38. SJTU-AISPEECH System for VoxCeleb Speaker Recognition Challenge 2022
                                        Zhengyang Chen , Bing Han , Xu Xiang , Houjun Huang , Bei Liu , and Yanmin Qian
                                        CoRR, Oct 2022
                                      39. Build a SRE Challenge System: Lessons from VoxSRC 2022 and CNSRC 2022
                                        Zhengyang Chen , Bing Han , Xu Xiang , Houjun Huang , Bei Liu , and Yanmin Qian
                                        CoRR, Oct 2022
                                      40. Factorized Neural Transducer for Efficient Language Model Adaptation
                                        Xie Chen, Zhong Meng , Sarangarajan Parthasarathy , and Jinyu Li
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      41. VQTTS: High-Fidelity Text-to-Speech Synthesis with Self-Supervised VQ Acoustic Feature
                                        Chenpeng Du , Yiwei Guo , Xie Chen, and Kai Yu
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      42. Internal Language Model Adaptation with Text-Only Data for End-to-End Speech Recognition
                                        Zhong Meng , Yashesh Gaur , Naoyuki Kanda , Jinyu Li , Xie Chen , Yu Wu , and Yifan Gong
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      43. Exploring Effective Distillation of Self-Supervised Speech Models for Automatic Speech Recognition
                                        Yujin Wang , Changli Tang , Ziyang Ma , Zhisheng Zheng , Xie Chen, and Wei-Qiang Zhang
                                        CoRR, Oct 2022
                                      44. MT4SSL: Boosting Self-Supervised Speech Representation Learning by Integrating Multiple Targets
                                        Ziyang Ma , Zhisheng Zheng , Changli Tang , Yujin Wang , and Xie Chen
                                        CoRR, Oct 2022
                                      45. EmoDiff: Intensity Controllable Emotional Text-to-Speech with Soft-Label Guidance
                                        Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
                                        CoRR, Oct 2022
                                      46. Exploring Effective Fusion Algorithms for Speech Based Self-Supervised Learning Models
                                        Changli Tang , Yujin Wang , Xie Chen, and Wei-Qiang Zhang
                                        CoRR, Oct 2022
                                      47. D4: a Chinese Dialogue Dataset for Depression-Diagnosis-Oriented Chat
                                        Binwei Yao , Chao Shi , Likai Zou , Lingfeng Dai , Mengyue Wu, Lu Chen, Zhen Wang , and Kai Yu
                                        In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
                                      48. Symptom Identification for Interpretable Detection of Multiple Mental Disorders on Social Media
                                        Zhiling Zhang , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
                                      49. Category-Adapted Sound Event Enhancement with Weakly Labeled Data
                                        Guangwei Li , Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      50. Diversity-Controllable and Accurate Audio Captioning Based on Neural Condition
                                        Xuenan Xu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      51. Can Audio Captions Be Evaluated With Image Caption Metrics?
                                        Zelin Zhou , Zhiling Zhang , Xuenan Xu , Zeyu Xie , Mengyue Wu , and Kenny Q. Zhu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      52. Navigating Audio-Visual Event Detection Across Mismatched Modalities
                                        Guangwei Li , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      53. Audio-Text Retrieval in Context
                                        Siyu Lou , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      54. Climate and Weather: Inspecting Depression Detection via Emotion Recognition
                                        Wen Wu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      55. Psychiatric Scale Guided Risky Post Screening for Early Detection of Depression
                                        Zhiling Zhang , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence, IJCAI 2022, Vienna, Austria, 23-29 July 2022 , Oct 2022
                                      56. A Comprehensive Survey of Automated Audio Captioning
                                        Xuenan Xu , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2022
                                      57. DialogZoo: Large-Scale Dialog-Oriented Task Learning
                                        Zhi Chen , Jijia Bao , Lu Chen, Yuncong Liu , Da Ma , Bei Chen , Mengyue Wu , Su Zhu , Jian-Guang Lou , and Kai Yu
                                        CoRR, Oct 2022
                                      58. Data augmentation based non-parallel voice conversion with frame-level speaker disentangler
                                        Bo Chen , Zhihang Xu , and Kai Yu
                                        Speech Commun., Oct 2022
                                      59. Phone-Level Prosody Modelling With GMM-Based MDN for Diverse and Controllable Speech Synthesis
                                        Chenpeng Du , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      60. Neural Fusion for Voice Cloning
                                        Bo Chen , Chenpeng Du , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      61. META-GUI: Towards Multi-modal Conversational Agents on Mobile GUI
                                        Liangtai Sun , Xingyu Chen , Lu Chen, Tianle Dai , Zichen Zhu, and Kai Yu
                                        In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
                                      62. AdapterShare: Task Correlation Modeling with Adapter Differentiation
                                        Zhi Chen , Bei Chen , Lu Chen, Kai Yu, and Jian-Guang Lou
                                        In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
                                      63. LatticeBART: Lattice-to-Lattice Pre-Training for Speech Recognition
                                        Lingfeng Dai , Lu Chen, Zhikai Zhou , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      64. Text Adaptive Detection for Customizable Keyword Spotting
                                        Yu Xi , Tian Tan , Wangyou Zhang , Baochen Yang , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      65. Unsupervised Word-Level Prosody Tagging for Controllable Speech Synthesis
                                        Yiwei Guo , Chenpeng Du , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      66. The AISP-SJTU Simultaneous Translation System for IWSLT 2022
                                        Qinpei Zhu , Renshou Wu , Guangfeng Liu , Xinyu Zhu , Xingyu Chen , Yang Zhou , Qingliang Miao , Rui Wang , and Kai Yu
                                        In Proceedings of the 19th International Conference on Spoken Language Translation, IWSLT@ACL 2022, Dublin, Ireland (in-person and online), May 26-27, 2022 , Oct 2022
                                      67. TIE: Topological Information Enhanced Structural Reading Comprehension on Web Pages
                                        Zihan Zhao , Lu Chen, Ruisheng Cao , Hongshen Xu , Xingyu Chen , and Kai Yu
                                        In Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL 2022, Seattle, WA, United States, July 10-15, 2022 , Oct 2022
                                      68. UniDU: Towards A Unified Generative Dialogue Understanding Framework
                                        Zhi Chen , Lu Chen , Bei Chen , Libo Qin , Yuncong Liu , Su Zhu , Jian-Guang Lou , and Kai Yu
                                        In Proceedings of the 23rd Annual Meeting of the Special Interest Group on Discourse and Dialogue, SIGDIAL 2022, Edinburgh, UK, 07-09 September 2022 , Oct 2022
                                      69. The AISP-SJTU Translation System for WMT 2022
                                        Guangfeng Liu , Qinpei Zhu , Xingyu Chen , Renjie Feng , Jianxin Ren , Renshou Wu , Qingliang Miao , Rui Wang , and Kai Yu
                                        In Proceedings of the Seventh Conference on Machine Translation, WMT 2022, Abu Dhabi, United Arab Emirates (Hybrid), December 7-8, 2022 , Oct 2022

                                      2021

                                      1. Modified Magnitude-Phase Spectrum Information for Spoofing Detection
                                        Jichen Yang , Hongji Wang , Rohan Kumar Das , and Yanmin Qian
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
                                      2. Audio-Visual Deep Neural Network for Robust Person Verification
                                        Yanmin Qian , Zhengyang Chen , and Shuai Wang
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
                                      3. Dual-Path Modeling for Long Recording Speech Separation in Meetings
                                        Chenda Li , Zhuo Chen , Yi Luo , Cong Han , Tianyan Zhou , Keisuke Kinoshita , Marc Delcroix , Shinji Watanabe , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      4. Self-Supervised Learning Based Domain Adaptation for Robust Speaker Verification
                                        Zhengyang Chen , Shuai Wang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      5. SynAug: Synthesis-Based Data Augmentation for Text-Dependent Speaker Verification
                                        Chenpeng Du , Bing Han , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      6. Unit Selection Synthesis Based Data Augmentation for Fixed Phrase Speaker Verification
                                        Houjun Huang , Xu Xiang , Fei Zhao , Shuai Wang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      7. AISpeech-SJTU Accent Identification System for the Accented English Speech Recognition Challenge
                                        Houjun Huang , Xu Xiang , Yexin Yang , Rao Ma , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      8. AISpeech-SJTU ASR System for the Accented English Speech Recognition Challenge
                                        Tian Tan , Yizhou Lu , Rao Ma , Sen Zhu , Jiaqi Guo , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      9. Towards Data Selection on TTS Data for Children’s Speech Recognition
                                        Wei Wang , Zhikai Zhou , Yizhou Lu , Hongji Wang , Chenpeng Du , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      10. End-to-End Dereverberation, Beamforming, and Speech Recognition with Improved Numerical Stability and Advanced Frontend
                                        Wangyou Zhang , Christoph Böddeker , Shinji Watanabe , Tomohiro Nakatani , Marc Delcroix , Keisuke Kinoshita , Tsubasa Ochiai , Naoyuki Kamo , Reinhold Haeb-Umbach , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      11. The Accented English Speech Recognition Challenge 2020: Open Datasets, Tracks, Baselines, Results and Methods
                                        Xian Shi , Fan Yu , Yizhou Lu , Yuhao Liang , Qiangze Feng , Daliang Wang , Yanmin Qian , and Lei Xie
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      12. Convolutive Transfer Function Invariant SDR Training Criteria for Multi-Channel Reverberant Speech Separation
                                        Christoph Böddeker , Wangyou Zhang , Tomohiro Nakatani , Keisuke Kinoshita , Tsubasa Ochiai , Marc Delcroix , Naoyuki Kamo , Yanmin Qian , and Reinhold Haeb-Umbach
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      13. Layer-Wise Fast Adaptation for End-to-End Multi-Accent Speech Recognition
                                        Xun Gong , Yizhou Lu , Zhikai Zhou , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      14. Knowledge Distillation from Multi-Modality to Single-Modality for Person Verification
                                        Leying Zhang , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      15. Basis-MelGAN: Efficient Neural Vocoder Based on Audio Decomposition
                                        Zhengxi Liu , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      16. The SJTU System for Short-Duration Speaker Verification Challenge 2021
                                        Bing Han , Zhengyang Chen , Zhikai Zhou , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      17. Audio-Visual Multi-Talker Speech Recognition in a Cocktail Party
                                        Yifei Wu , Chenda Li , Song Yang , Zhongqin Wu , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      18. Speaker Embedding Augmentation with Noise Distribution Matching
                                        Xun Gong , Zhengyang Chen , Yexin Yang , Shuai Wang , Lan Wang , and Yanmin Qian
                                        In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
                                      19. Revisiting the Statistics Pooling Layer in Deep Speaker Embedding Learning
                                        Shuai Wang , Yexin Yang , Yanmin Qian , and Kai Yu
                                        In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
                                      20. Data Augmentation for end-to-end Code-Switching Speech Recognition
                                        Chenpeng Du , Hao Li , Yizhou Lu , Lan Wang , and Yanmin Qian
                                        In IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021 , Oct 2021
                                      21. Dual-Path RNN for Long Recording Speech Separation
                                        Chenda Li , Yi Luo , Cong Han , Jinyu Li , Takuya Yoshioka , Tianyan Zhou , Marc Delcroix , Keisuke Kinoshita , Christoph Böddeker , Yanmin Qian , Shinji Watanabe , and Zhuo Chen
                                        In IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021 , Oct 2021
                                      22. Closing the Gap Between Time-Domain Multi-Channel Speech Enhancement on Real and Simulation Conditions
                                        Wangyou Zhang , Jing Shi , Chenda Li , Shinji Watanabe , and Yanmin Qian
                                        In IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2021, New Paltz, NY, USA, October 17-20, 2021 , Oct 2021
                                      23. Towards Duration Robust Weakly Supervised Sound Event Detection
                                        Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
                                      24. Voice Activity Detection in the Wild: A Data-Driven Approach Using Teacher-Student Training
                                        Heinrich Dinkel , Shuai Wang , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
                                      25. Building Interpretable Interaction Trees for Deep NLP Models
                                        Die Zhang , Hao Zhang , Huilin Zhou , Xiaoyi Bao , Da Huo , Ruizhao Chen , Xu Cheng , Mengyue Wu, and Quanshi Zhang
                                        In Thirty-Fifth AAAI Conference on Artificial Intelligence, AAAI 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, IAAI 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, EAAI 2021, Virtual Event, February 2-9, 2021 , Oct 2021
                                      26. Decoupled Dialogue Modeling and Semantic Parsing for Multi-Turn Text-to-SQL
                                        Zhi Chen , Lu Chen, Hanqi Li , Ruisheng Cao , Da Ma , Mengyue Wu, and Kai Yu
                                        In Findings of the Association for Computational Linguistics: ACL/IJCNLP 2021, Online Event, August 1-6, 2021 , Oct 2021
                                      27. Enriching Ontology with Temporal Commonsense for Low-Resource Audio Tagging
                                        Zhiling Zhang , Zelin Zhou , Haifeng Tang , Guangwei Li , Mengyue Wu , and Kenny Q. Zhu
                                        In CIKM ’21: The 30th ACM International Conference on Information and Knowledge Management, Virtual Event, Queensland, Australia, November 1 - 5, 2021 , Oct 2021
                                      28. Text-to-Audio Grounding: Building Correspondence Between Captions and Sound Events
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      29. Investigating Local and Global Information for Automated Audio Captioning with Transfer Learning
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, Zeyu Xie , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      30. A Lightweight Framework for Online Voice Activity Detection in the Wild
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      31. Audio Caption in a Car Setting with a Sentence-Level Loss
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
                                      32. DEPA: Self-Supervised Audio Embedding for Depression Detection
                                        Pingyue Zhang , Mengyue Wu, Heinrich Dinkel , and Kai Yu
                                        In MM ’21: ACM Multimedia Conference, Virtual Event, China, October 20 - 24, 2021 , Oct 2021
                                      33. LET: Linguistic Knowledge Enhanced Graph Transformer for Chinese Short Text Matching
                                        Boer Lyu , Lu Chen , Su Zhu , and Kai Yu
                                        In Thirty-Fifth AAAI Conference on Artificial Intelligence, AAAI 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, IAAI 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, EAAI 2021, Virtual Event, February 2-9, 2021 , Oct 2021
                                      34. LGESQL: Line Graph Enhanced Text-to-SQL Model with Mixed Local and Non-Local Relations
                                        Ruisheng Cao , Lu Chen , Zhi Chen , Yanbin Zhao , Su Zhu , and Kai Yu
                                        In Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing, ACL/IJCNLP 2021, (Volume 1: Long Papers), Virtual Event, August 1-6, 2021 , Oct 2021
                                      35. WebSRC: A Dataset for Web-Based Structural Reading Comprehension
                                        Xingyu Chen , Zihan Zhao , Lu Chen, Jiabao Ji , Danyang Zhang , Ao Luo , Yuxuan Xiong , and Kai Yu
                                        In Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, EMNLP 2021, Virtual Event / Punta Cana, Dominican Republic, 7-11 November, 2021 , Oct 2021
                                      36. Glyph Enhanced Chinese Character Pre-Training for Lexical Sememe Prediction
                                        Boer Lyu , Lu Chen, and Kai Yu
                                        In Findings of the Association for Computational Linguistics: EMNLP 2021, Virtual Event / Punta Cana, Dominican Republic, 16-20 November, 2021 , Oct 2021
                                      37. Class-Based Neural Network Language Model for Second-Pass Rescoring in ASR
                                        Lingfeng Dai , Qi Liu , and Kai Yu
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      38. Rich Prosody Diversity Modelling with Phone-Level Mixture Density Network
                                        Chenpeng Du , and Kai Yu
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      39. ShadowGNN: Graph Projection Neural Network for Text-to-SQL Parser
                                        Zhi Chen , Lu Chen, Yanbin Zhao , Ruisheng Cao , Zihan Xu , Su Zhu , and Kai Yu
                                        In Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2021, Online, June 6-11, 2021 , Oct 2021
                                      40. Few-Shot NLU with Vector Projection Distance and Abstract Triangular CRF
                                        Su Zhu , Lu Chen, Ruisheng Cao , Zhi Chen , Qingliang Miao , and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 10th CCF International Conference, NLPCC 2021, Qingdao, China, October 13-17, 2021, Proceedings, Part I , Oct 2021
                                      41. Relation-Aware Multi-hop Reasoning for Visual Dialog
                                        Yao Zhao , Lu Chen, and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 10th CCF International Conference, NLPCC 2021, Qingdao, China, October 13-17, 2021, Proceedings, Part I , Oct 2021
                                      42. Mixture Density Network for Phone-Level Prosody Modelling in Speech Synthesis
                                        Chenpeng Du , and Kai Yu
                                        CoRR, Oct 2021
                                      43. Diverse and Controllable Speech Synthesis with GMM-Based Phone-Level Prosody Modelling
                                        Chenpeng Du , and Kai Yu
                                        CoRR, Oct 2021

                                      2020

                                      1. Improving End-to-End Single-Channel Multi-Talker Speech Recognition
                                        Wangyou Zhang , Xuankai Chang , Yanmin Qian , and Shinji Watanabe
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      2. Data Augmentation Using Deep Generative Models for Embedding Based Speaker Recognition
                                        Shuai Wang , Yexin Yang , Zhanghao Wu , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      3. End-To-End Multi-Speaker Speech Recognition With Transformer
                                        Xuankai Chang , Wangyou Zhang , Yanmin Qian , Jonathan Le Roux , and Shinji Watanabe
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      4. Text Adaptation for Speaker Verification with Speaker-Text Factorized Embeddings
                                        Yexin Yang , Shuai Wang , Xun Gong , Yanmin Qian , and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      5. Channel Invariant Speaker Embedding Learning with Joint Multi-Task and Adversarial Training
                                        Zhengyang Chen , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      6. Deep Audio-Visual Speech Separation with Attention Mechanism
                                        Chenda Li , and Yanmin Qian
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      7. Learning Contextual Language Embeddings for Monaural Multi-Talker Speech Recognition
                                        Wangyou Zhang , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      8. End-to-End Far-Field Speech Recognition with Unified Dereverberation and Beamforming
                                        Wangyou Zhang , Aswin Shanmugam Subramanian , Xuankai Chang , Shinji Watanabe , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      9. Dual-Adversarial Domain Adaptation for Generalized Replay Attack Detection
                                        Hongji Wang , Heinrich Dinkel , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      10. Listen, Watch and Understand at the Cocktail Party: Audio-Visual-Contextual Speech Separation
                                        Chenda Li , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      11. Multi-Modality Matters: A Performance Leap on VoxCeleb
                                        Zhengyang Chen , Shuai Wang , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      12. Adversarial Domain Adaptation for Speaker Verification Using Partially Shared Network
                                        Zhengyang Chen , Shuai Wang , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      13. Bi-Encoder Transformer Network for Mandarin-English Code-Switching Speech Recognition Using Mixture of Experts
                                        Yizhou Lu , Mingkun Huang , Hao Li , Jiaqi Guo , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      14. End-to-End Speaker-Dependent Voice Activity Detection
                                        Yefei Chen , Shuai Wang , Yanmin Qian , and Kai Yu
                                        CoRR, Oct 2020
                                      15. A CRNN-GRU Based Reinforcement Learning Approach to Audio Captioning
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In Proceedings of the 5th Workshop on Detection and Classification of Acoustic Scenes and Events 2020 (DCASE 2020), Tokyo, Japan (full virtual), November 2-4, 2020 , Oct 2020
                                      16. Multiple Sound Sources Localization from Coarse to Fine
                                        Rui Qian , Di Hu , Heinrich Dinkel , Mengyue Wu, Ning Xu , and Weiyao Lin
                                        In Computer Vision - ECCV 2020 - 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part XX , Oct 2020
                                      17. Voice Activity Detection in the Wild via Weakly Supervised Sound Event Detection
                                        Yefei Chen , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      18. GPVAD: Towards noise robust voice activity detection via weakly supervised sound event detection
                                        Heinrich Dinkel , Yefei Chen , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2020
                                      19. Interpreting Hierarchical Linguistic Interactions in DNNs
                                        Die Zhang , Huilin Zhou , Xiaoyi Bao , Da Huo , Ruizhao Chen , Xu Cheng , Hao Zhang , Mengyue Wu, and Quanshi Zhang
                                        CoRR, Oct 2020
                                      20. Towards a new generation of artificial intelligence in China
                                        Fei Wu , Cewu Lu , Mingjie Zhu , Hao Chen , Jun Zhu , Kai Yu, Lei Li , Ming Li , Qianfeng Chen , Xi Li , Xudong Cao , Zhongyuan Wang , Zhengjun Zha , Yueting Zhuang , and Yunhe Pan
                                        Nat. Mach. Intell., Oct 2020
                                      21. Prior Knowledge Driven Label Embedding for Slot Filling in Natural Language Understanding
                                        Su Zhu , Zijian Zhao , Rao Ma , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      22. Dual Learning for Semi-Supervised Natural Language Understanding
                                        Su Zhu , Ruisheng Cao , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      23. Modular End-to-End Automatic Speech Recognition Framework for Acoustic-to-Word Model
                                        Qi Liu , Zhehuai Chen , Hao Li , Mingkun Huang , Yizhou Lu , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      24. Distributed Structured Actor-Critic Reinforcement Learning for Universal Dialogue Management
                                        Zhi Chen , Lu Chen, Xiaoyuan Liu , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      25. Neural Network Language Model Compression With Product Quantization and Soft Binarization
                                        Kai Yu, Rao Ma , Kaiyu Shi , and Qi Liu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      26. Schema-Guided Multi-Domain Dialogue State Tracking with Graph Attention Neural Networks
                                        Lu Chen, Boer Lv , Chi Wang , Su Zhu , Bowen Tan , and Kai Yu
                                        In The Thirty-Fourth AAAI Conference on Artificial Intelligence, AAAI 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, IAAI 2020, The Tenth AAAI Symposium on Educational Advances in Artificial Intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 , Oct 2020
                                      27. Semi-Supervised Text Simplification with Back-Translation and Asymmetric Denoising Autoencoders
                                        Yanbin Zhao , Lu Chen , Zhi Chen , and Kai Yu
                                        In The Thirty-Fourth AAAI Conference on Artificial Intelligence, AAAI 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, IAAI 2020, The Tenth AAAI Symposium on Educational Advances in Artificial Intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 , Oct 2020
                                      28. Line Graph Enhanced AMR-to-Text Generation with Mix-Order Graph Attention Networks
                                        Yanbin Zhao , Lu Chen , Zhi Chen , Ruisheng Cao , Su Zhu , and Kai Yu
                                        In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
                                      29. Neural Graph Matching Networks for Chinese Short Text Matching
                                        Lu Chen, Yanbin Zhao , Boer Lyu , Lesheng Jin , Zhi Chen , Su Zhu , and Kai Yu
                                        In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
                                      30. Unsupervised Dual Paraphrasing for Two-stage Semantic Parsing
                                        Ruisheng Cao , Su Zhu , Chenyu Yang , Chen Liu , Rao Ma , Yanbin Zhao , Lu Chen, and Kai Yu
                                        In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
                                      31. Efficient Context and Schema Fusion Networks for Multi-Domain Dialogue State Tracking
                                        Su Zhu , Jieyu Li , Lu Chen, and Kai Yu
                                        In Findings of the Association for Computational Linguistics: EMNLP 2020, Online Event, 16-20 November 2020 , Oct 2020
                                      32. Duration Robust Weakly Supervised Sound Event Detection
                                        Heinrich Dinkel and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      33. Investigation of Specaugment for Deep Speaker Embedding Learning
                                        Shuai Wang , Johan Rohdin , Oldřich Plchot , Lukáš Burget , Kai Yu, and Jan Černocký
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      34. Speaker Augmentation for Low Resource Speech Recognition
                                        Chenpeng Du and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      35. Neural Lattice Search for Speech Recognition
                                        Rao Ma , Hao Li , Qi Liu , Lu Chen, and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      36. A Hierarchical Tracker for Multi-Domain Dialogue State Tracking
                                        Jieyu Li , Su Zhu , and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      37. Addressing the Polysemy Problem in Language Modeling with Attentional Multi-Sense Embeddings
                                        Rao Ma , Lesheng Jin , Qi Liu , Lu Chen, and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      38. CODA: Improving Resource Utilization by Slimming and Co-locating DNN and CPU Jobs
                                        Han Zhao , Weihao Cui , Quan Chen , Jingwen Leng , Kai Yu, Deze Zeng , Chao Li , and Minyi Guo
                                        In 40th IEEE International Conference on Distributed Computing Systems, ICDCS 2020, Singapore, November 29 - December 1, 2020 , Oct 2020
                                      39. Jointly Encoding Word Confusion Network and Dialogue Context with BERT for Spoken Language Understanding
                                        Chen Liu , Su Zhu , Zijian Zhao , Ruisheng Cao , Lu Chen, and Kai Yu
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      40. Memory Attention Neural Network for Multi-domain Dialogue State Tracking
                                        Zihan Xu , Zhi Chen , Lu Chen , Su Zhu , and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
                                      41. Robust Spoken Language Understanding with RL-Based Value Error Recovery
                                        Chen Liu , Su Zhu , Lu Chen, and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
                                      42. An Investigation on Different Underlying Quantization Schemes for Pre-trained Language Models
                                        Zihan Zhao , Yuncong Liu , Lu Chen, Qi Liu , Rao Ma , and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
                                      43. An Investigation on Deep Learning with Beta Stabilizer
                                        Qi Liu , Tian Tan , and Kai Yu
                                        CoRR, Oct 2020
                                      44. Vector Projection Network for Few-shot Slot Tagging in Natural Language Understanding
                                        Su Zhu , Ruisheng Cao , Lu Chen, and Kai Yu
                                        CoRR, Oct 2020
                                      45. Deep Reinforcement Learning for On-line Dialogue State Tracking
                                        Zhi Chen , Lu Chen, Xiang Zhou , and Kai Yu
                                        CoRR, Oct 2020
                                      46. Structured Hierarchical Dialogue Policy with Graph Neural Networks
                                        Zhi Chen , Xiaoyuan Liu , Lu Chen, and Kai Yu
                                        CoRR, Oct 2020
                                      47. Dual Learning for Dialogue State Tracking
                                        Zhi Chen , Lu Chen, Yanbin Zhao , Su Zhu , and Kai Yu
                                        CoRR, Oct 2020
                                      48. CREDIT: Coarse-to-Fine Sequence Generation for Dialogue State Tracking
                                        Zhi Chen , Lu Chen, Zihan Xu , Yanbin Zhao , Su Zhu , and Kai Yu
                                        CoRR, Oct 2020

                                      2019

                                      1. Erratum to: Past review, current progress, and challenges ahead on the cocktail party problem
                                        Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
                                        Frontiers Inf. Technol. Electron. Eng., Oct 2019
                                      2. Binary neural networks for speech recognition
                                        Yanmin Qian and Xu Xiang
                                        Frontiers Inf. Technol. Electron. Eng., Oct 2019
                                      3. Data augmentation using generative adversarial networks for robust speech recognition
                                        Yanmin Qian , Hu Hu , and Tian Tan
                                        Speech Commun., Oct 2019
                                      4. Discriminative Neural Embedding Learning for Short-Duration Text-Independent Speaker Verification
                                        Shuai Wang , Zili Huang , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2019
                                      5. Margin Matters: Towards More Discriminative Deep Neural Network Embeddings for Speaker Recognition
                                        Xu Xiang , Shuai Wang , Houjun Huang , Yanmin Qian , and Kai Yu
                                        In 2019 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2019, Lanzhou, China, November 18-21, 2019 , Oct 2019
                                      6. GANs for Children: A Generative Data Augmentation Strategy for Children Speech Recognition
                                        Peiyao Sheng , Zhuolin Yang , and Yanmin Qian
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      7. MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition
                                        Xuankai Chang , Wangyou Zhang , Yanmin Qian , Jonathan Le Roux , and Shinji Watanabe
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      8. Exploring Model Units and Training Strategies for End-to-End Speech Recognition
                                        Mingkun Huang , Yizhou Lu , Lan Wang , Yanmin Qian , and Kai Yu
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      9. End-to-End Overlapped Speech Detection and Speaker Counting with Raw Waveform
                                        Wangyou Zhang , Man Sun , Lan Wang , and Yanmin Qian
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      10. Knowledge Distillation for Small Foot-print Deep Speaker Embedding
                                        Shuai Wang , Yexin Yang , Tianzhe Wang , Yanmin Qian , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
                                      11. End-to-end Monaural Multi-speaker ASR System without Pretraining
                                        Xuankai Chang , Yanmin Qian , Kai Yu, and Shinji Watanabe
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
                                      12. The SJTU Robust Anti-Spoofing System for the ASVspoof 2019 Challenge
                                        Yexin Yang , Hongji Wang , Heinrich Dinkel , Zhengyang Chen , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      13. On the Usage of Phonetic Information for Text-Independent Speaker Embedding Extraction
                                        Shuai Wang , Johan Rohdin , Lukáš Burget , Oldřich Plchot , Yanmin Qian , Kai Yu, and Jan Černocký
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      14. Data Augmentation Using Variational Autoencoder for Embedding Based Speaker Verification
                                        Zhanghao Wu , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      15. Joint Decoding of CTC Based Systems for Speech Recognition
                                        Jiaqi Guo , Yongbin You , Yanmin Qian , and Kai Yu
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      16. Knowledge Distillation for End-to-End Monaural Multi-Talker ASR System
                                        Wangyou Zhang , Xuankai Chang , and Yanmin Qian
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      17. Robust DOA Estimation Based on Convolutional Neural Network and Time-Frequency Masking
                                        Wangyou Zhang , Ying Zhou , and Yanmin Qian
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      18. Cross-Domain Replay Spoofing Attack Detection Using Domain Adversarial Training
                                        Hongji Wang , Heinrich Dinkel , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      19. Prosody Usage Optimization for Children Speech Recognition with Zero Resource Children Speech
                                        Chenda Li and Yanmin Qian
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      20. Audio Caption: Listen and Tell
                                        Mengyue Wu, Heinrich Dinkel , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
                                      21. Text-based Depression Detection: What Triggers An Alert
                                        Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2019
                                      22. What does a Car-ssette tape tell?
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2019
                                      23. AgentGraph: Toward Universal Dialogue Management With Structured Deep Reinforcement Learning
                                        Lu Chen , Zhi Chen , Bowen Tan , Sishan Long , Milica Gasic , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2019
                                      24. Semantic Parsing with Dual Learning
                                        Ruisheng Cao , Su Zhu , Chen Liu , Jieyu Li , and Kai Yu
                                        In Proceedings of the 57th Conference of the Association for Computational Linguistics, ACL 2019, Florence, Italy, July 28 - August 2, 2019, Volume 1: Long Papers , Oct 2019
                                      25. Highly Efficient Neural Network Language Model Compression Using Soft Binarization Training
                                        Rao Ma , Qi Liu , and Kai Yu
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      26. Data Augmentation with Atomic Templates for Spoken Language Understanding
                                        Zijian Zhao , Su Zhu , and Kai Yu
                                        In Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing, EMNLP-IJCNLP 2019, Hong Kong, China, November 3-7, 2019 , Oct 2019
                                      27. A Hierarchical Decoding Model for Spoken Language Understanding from Unaligned Data
                                        Zijian Zhao , Su Zhu , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
                                      28. CATSLU: The 1st Chinese Audio-Textual Spoken Language Understanding Challenge
                                        Su Zhu , Zijian Zhao , Tiejun Zhao , Chengqing Zong , and Kai Yu
                                        In International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019 , Oct 2019
                                      29. Robust Spoken Language Understanding with Acoustic and Domain Knowledge
                                        Hao Li , Chen Liu , Su Zhu , and Kai Yu
                                        In International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019 , Oct 2019
                                      30. Cross Aggregation of Multi-head Attention for Neural Machine Translation
                                        Juncheng Cao , Hai Zhao , and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 8th CCF International Conference, NLPCC 2019, Dunhuang, China, October 9-14, 2019, Proceedings, Part I , Oct 2019
                                      31. International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019
                                        Oct 2019

                                      2018

                                      1. Past review, current progress, and challenges ahead on the cocktail party problem
                                        Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
                                        Frontiers Inf. Technol. Electron. Eng., Oct 2018
                                      2. Erratum to: Past review, current progress, and challenges ahead on the cocktail party problem
                                        Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
                                        Frontiers Inf. Technol. Electron. Eng., Oct 2018
                                      3. Sequence discriminative training for deep learning based acoustic keyword spotting
                                        Zhehuai Chen , Yanmin Qian , and Kai Yu
                                        Speech Commun., Oct 2018
                                      4. Single-channel multi-talker speech recognition with permutation invariant training
                                        Yanmin Qian , Xuankai Chang , and Dong Yu
                                        Speech Commun., Oct 2018
                                      5. Adaptive Very Deep Convolutional Residual Network for Noise Robust Speech Recognition
                                        Tian Tan , Yanmin Qian , Hu Hu , Ying Zhou , Wen Ding , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
                                      6. Investigating Raw Wave Deep Neural Networks for End-to-End Speaker Spoofing Detection
                                        Heinrich Dinkel , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
                                      7. Robust Mask Estimation By Integrating Neural Network-Based and Clustering-Based Approaches for Adaptive Acoustic Beamforming
                                        Ying Zhou and Yanmin Qian
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      8. Knowledge Transfer in Permutation Invariant Training for Single-Channel Multi-Talker Speech Recognition
                                        Tian Tan , Yanmin Qian , and Dong Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      9. Joint I-Vector with End-to-End System for Short Duration Text-Independent Speaker Verification
                                        Zili Huang , Shuai Wang , and Yanmin Qian
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      10. Generative Adversarial Networks Based Data Augmentation for Noise Robust Speech Recognition
                                        Hu Hu , Tian Tan , and Yanmin Qian
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      11. Focal KL-Divergence Based Dilated Convolutional Neural Networks for Co-Channel Speaker Identification
                                        Shuai Wang , Yanmin Qian , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      12. Noise Robust Speech Recognition on Aurora4 by Humans and Machines
                                        Yanmin Qian , Tian Tan , Hu Hu , and Qi Liu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      13. Fast Adaptation on Deep Mixture Generative Network Based Acoustic Modeling
                                        Wen Ding , Tian Tan , and Yanmin Qian
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      14. Adaptive Permutation Invariant Training with Auxiliary Information for Monaural Multi-Talker Speech Recognition
                                        Xuankai Chang , Yanmin Qian , and Dong Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      15. Permutation Invariant Training of Generative Adversarial Network for Monaural Speech Separation
                                        Lianwu Chen , Meng Yu , Yanmin Qian , Dan Su , and Dong Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      16. Deep Extractor Network for Target Speaker Recovery from Single Channel Speech Mixtures
                                        Jun Wang , Jie Chen , Dan Su , Lianwu Chen , Meng Yu , Yanmin Qian , and Dong Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      17. Monaural Multi-Talker Speech Recognition with Attention Mechanism and Gated Convolutional Networks
                                        Xuankai Chang , Yanmin Qian , and Dong Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      18. Knowledge Distillation for Sequence Model
                                        Mingkun Huang , Yongbin You , Zhehuai Chen , Yanmin Qian , and Kai Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      19. Covariance Based Deep Feature for Text-Dependent Speaker Verification
                                        Shuai Wang , Heinrich Dinkel , Yanmin Qian , and Kai Yu
                                        In Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers , Oct 2018
                                      20. Data Augmentation using Conditional Generative Adversarial Networks for Robust Speech Recognition
                                        Peiyao Sheng , Zhuolin Yang , Hu Hu , Tian Tan , and Yanmin Qian
                                        In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
                                      21. Deep Discriminant Analysis for i-vector Based Robust Speaker Recognition
                                        Shuai Wang , Zili Huang , Yanmin Qian , and Kai Yu
                                        In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
                                      22. Generative Adversarial Networks based X-vector Augmentation for Robust Probabilistic Linear Discriminant Analysis in Speaker Verification
                                        Yexin Yang , Shuai Wang , Man Sun , Yanmin Qian , and Kai Yu
                                        In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
                                      23. Rich Short Text Conversation Using Semantic-Key-Controlled Sequence Generation
                                        Kai Yu, Zijian Zhao , Xueyang Wu , Hongtao Lin , and Xuan Liu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
                                      24. Structured Dialogue Policy with Graph Neural Networks
                                        Lu Chen, Bowen Tan , Sishan Long , and Kai Yu
                                        In Proceedings of the 27th International Conference on Computational Linguistics, COLING 2018, Santa Fe, New Mexico, USA, August 20-26, 2018 , Oct 2018
                                      25. Towards Universal Dialogue State Tracking
                                        Liliang Ren , Kaige Xie , Lu Chen, and Kai Yu
                                        In Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, Brussels, Belgium, October 31 - November 4, 2018 , Oct 2018
                                      26. On Modular Training of Neural Acoustics-to-Word Model for LVCSR
                                        Zhehuai Chen , Qi Liu , Hao Li , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      27. Semi-Supervised Training Using Adversarial Multi-Task Learning for Spoken Language Understanding
                                        Ouyu Lan , Su Zhu , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      28. Policy Adaptation for Deep Reinforcement Learning-Based Dialogue Management
                                        Lu Chen, Cheng Chang , Zhi Chen , Bowen Tan , Milica Gasic , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      29. Robust Spoken Language Understanding with Unsupervised ASR-Error Adaptation
                                        Su Zhu , Ouyu Lan , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      30. MLN: Moment localization Network and Samples Selection for Moment Retrieval
                                        Bo Huang , Ya Zhang , and Kai Yu
                                        In Proceedings of the 2nd International Conference on Video and Image Processing, ICVIP 2018, Hong Kong, China, December 29-31, 2018 , Oct 2018
                                      31. Angular Softmax for Short-Duration Text-independent Speaker Verification
                                        Zili Huang , Shuai Wang , and Kai Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      32. Joint Spoken Language Understanding and Domain Adaptive Language Modeling
                                        Huifeng Zhang , Su Zhu , Shuai Fan , and Kai Yu
                                        In Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers , Oct 2018
                                      33. Binarized LSTM Language Model
                                        Xuan Liu , Di Cao , and Kai Yu
                                        In Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2018, New Orleans, Louisiana, USA, June 1-6, 2018, Volume 1 (Long Papers) , Oct 2018
                                      34. Cost-Sensitive Active Learning for Dialogue State Tracking
                                        Kaige Xie , Cheng Chang , Liliang Ren , Lu Chen, and Kai Yu
                                        In Proceedings of the 19th Annual SIGdial Meeting on Discourse and Dialogue, Melbourne, Australia, July 12-14, 2018 , Oct 2018
                                      35. Concept Transfer Learning for Adaptive Language Understanding
                                        Su Zhu and Kai Yu
                                        In Proceedings of the 19th Annual SIGdial Meeting on Discourse and Dialogue, Melbourne, Australia, July 12-14, 2018 , Oct 2018
                                      36. Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers
                                        Oct 2018

                                      2017

                                      1. Phone Synchronous Speech Recognition With CTC Lattices
                                        Zhehuai Chen , Yimeng Zhuang , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2017
                                      2. Deep Feature Engineering for Noise Robust Spoofing Detection
                                        Yanmin Qian , Nanxin Chen , Heinrich Dinkel , and Zhizheng Wu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2017
                                      3. Integrating online i-vector into GMM-UBM for text-dependent speaker verification
                                        Xiaowei Jiang , Shuai Wang , Xu Xiang , and Yanmin Qian
                                        In 2017 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2017, Kuala Lumpur, Malaysia, December 12-15, 2017 , Oct 2017
                                      4. Future vector enhanced LSTM language model for LVCSR
                                        Qi Liu , Yanmin Qian , and Kai Yu
                                        In 2017 IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2017, Okinawa, Japan, December 16-20, 2017 , Oct 2017
                                      5. Multi-view LSTM Language Model with Word-Synchronized Auxiliary Feature for LVCSR
                                        Yue Wu , Tianxing He , Zhehuai Chen , Yanmin Qian , and Kai Yu
                                        In Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data - 16th China National Conference, CCL 2017, - and - 5th International Symposium, NLP-NABD 2017, Nanjing, China, October 13-15, 2017, Proceedings , Oct 2017
                                      6. End-to-end spoofing detection with raw waveform CLDNNS
                                        Heinrich Dinkel , Nanxin Chen , Yanmin Qian , and Kai Yu
                                        In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
                                      7. Small-footprint convolutional neural network for spoofing detection
                                        Heinrich Dinkel , Yanmin Qian , and Kai Yu
                                        In 2017 International Joint Conference on Neural Networks, IJCNN 2017, Anchorage, AK, USA, May 14-19, 2017 , Oct 2017
                                      8. Binary Deep Neural Networks for Speech Recognition
                                        Xu Xiang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
                                      9. What Does the Speaker Embedding Encode?
                                        Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
                                      10. Recognizing Multi-Talker Speech with Permutation Invariant Training
                                        Dong Yu , Xuankai Chang , and Yanmin Qian
                                        In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
                                      11. A Unified Confidence Measure Framework Using Auxiliary Normalization Graph
                                        Zhehuai Chen , Yanmin Qian , and Kai Yu
                                        In Intelligence Science and Big Data Engineering - 7th International Conference, IScIDE 2017, Dalian, China, September 22-23, 2017, Proceedings , Oct 2017
                                      12. Adaptation of Deep Neural Network Acoustic Models for Robust Automatic Speech Recognition
                                        Khe Chai Sim , Yanmin Qian , Gautam Mantena , Lahiru Samarakoon , Souvik Kundu , and Tian Tan
                                        In New Era for Robust Speech Recognition, Exploiting Deep Learning , Oct 2017
                                      13. On-line Dialogue Policy Learning with Companion Teaching
                                        Lu Chen, Runzhe Yang , Cheng Chang , Zihao Ye , Xiang Zhou , and Kai Yu
                                        In Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics, EACL 2017, Valencia, Spain, April 3-7, 2017, Volume 2: Short Papers , Oct 2017
                                      14. Affordable On-line Dialogue Policy Learning
                                        Cheng Chang , Runzhe Yang , Lu Chen, Xiang Zhou , and Kai Yu
                                        In Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, EMNLP 2017, Copenhagen, Denmark, September 9-11, 2017 , Oct 2017
                                      15. Agent-Aware Dropout DQN for Safe and Efficient On-line Dialogue Policy Learning
                                        Lu Chen, Xiang Zhou , Cheng Chang , Runzhe Yang , and Kai Yu
                                        In Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, EMNLP 2017, Copenhagen, Denmark, September 9-11, 2017 , Oct 2017
                                      16. Confidence measures for CTC-based phone synchronous decoding
                                        Zhehuai Chen , Yimeng Zhuang , and Kai Yu
                                        In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
                                      17. Encoder-decoder with focus-mechanism for sequence labelling based spoken language understanding
                                        Su Zhu and Kai Yu
                                        In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
                                      18. Discrete Duration Model for Speech Synthesis
                                        Bo Chen , Tianling Bian , and Kai Yu
                                        In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
                                      19. Deep Attentive Structured Language Model Based on LSTM
                                        Di Cao and Kai Yu
                                        In Intelligence Science and Big Data Engineering - 7th International Conference, IScIDE 2017, Dalian, China, September 22-23, 2017, Proceedings , Oct 2017
                                      20. splab at the NTCIR-13 STC-2 Task
                                        Xuan Liu , Xueyang Wu , Ruinian Chen , Zijian Zhao , Hongtao Lin , and Kai Yu
                                        In The 13th NTCIR Conference, Evaluation of Information Access Technologies, National Center of Sciences, Tokyo, Japan, December 5-8, 2017 , Oct 2017

                                      2016

                                      1. Deep features for automatic spoofing detection
                                        Yanmin Qian , Nanxin Chen , and Kai Yu
                                        Speech Commun., Oct 2016
                                      2. Cluster Adaptive Training for Deep Neural Network Based Acoustic Model
                                        Tian Tan , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
                                      3. Neural Network Based Multi-Factor Aware Joint Training for Robust Speech Recognition
                                        Yanmin Qian , Tian Tan , and Dong Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
                                      4. Very Deep Convolutional Neural Networks for Noise Robust Speech Recognition
                                        Yanmin Qian , Mengxiao Bi , Tian Tan , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
                                      5. Overview of BTAS 2016 speaker anti-spoofing competition
                                        Pavel Korshunov , Sébastien Marcel , Hannah Muckenhirn , André R. Gonçalves , A. G. Souza Mello , Ricardo Paranhos Velloso Violato , Flávio Olmos Simões , M. U. Neto , Marcus Assis Angeloni , José Augusto Stuchi , Heinrich Dinkel , Nanxin Chen , Yanmin Qian , Dipjyoti Paul , Goutam Saha , and Md. Sahidullah
                                        In 8th IEEE International Conference on Biometrics Theory, Applications and Systems, BTAS 2016, Niagara Falls, NY, USA, September 6-9, 2016 , Oct 2016
                                      6. Joint acoustic factor learning for robust deep neural network based automatic speech recognition
                                        Souvik Kundu , Gautam Mantena , Yanmin Qian , Tian Tan , Marc Delcroix , and Khe Chai Sim
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      7. Speaker-aware training of LSTM-RNNS for acoustic modelling
                                        Tian Tan , Yanmin Qian , Dong Yu , Souvik Kundu , Liang Lu , Khe Chai Sim , Xiong Xiao , and Yu Zhang
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      8. Improved DNN-based segmentation for multi-genre broadcast audio
                                        Linlin Wang , Chao Zhang , Philip C. Woodland , Mark J. F. Gales , Panagiota Karanasou , Pierre Lanchantin , Xunying Liu , and Yanmin Qian
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      9. An investigation into using parallel data for far-field speech recognition
                                        Yanmin Qian , Tian Tan , and Dong Yu
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      10. Integrated adaptation with multi-factor joint-learning for far-field speech recognition
                                        Yanmin Qian , Tian Tan , Dong Yu , and Yu Zhang
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      11. Unrestricted Vocabulary Keyword Spotting Using LSTM-CTC
                                        Yimeng Zhuang , Xuankai Chang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
                                      12. Multi-task joint-learning for robust voice activity detection
                                        Yimeng Zhuang , Sibo Tong , Maofan Yin , Yanmin Qian , and Kai Yu
                                        In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
                                      13. Very deep convolutional neural networks for robust speech recognition
                                        Yanmin Qian and Philip C. Woodland
                                        In 2016 IEEE Spoken Language Technology Workshop, SLT 2016, San Diego, CA, USA, December 13-16, 2016 , Oct 2016
                                      14. Evolvable dialogue state tracking for statistical dialogue management
                                        Kai Yu, Lu Chen, Kai Sun , Qizhe Xie , and Su Zhu
                                        Frontiers Comput. Sci., Oct 2016
                                      15. Discriminatively trained joint speaker and environment representations for adaptation of deep neural network acoustic models
                                        Maofan Yin , Sunil Sivadas , Kai Yu, and Bin Ma
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      16. A comparative study of robustness of deep learning approaches for VAD
                                        Sibo Tong , Hao Gu , and Kai Yu
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      17. Phone Synchronous Decoding with CTC Lattice
                                        Zhehuai Chen , Wei Deng , Tao Xu , and Kai Yu
                                        In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
                                      18. Hybrid Dialogue State Tracking for Real World Human-to-Human Dialogues
                                        Kai Sun , Su Zhu , Lu Chen, Siqiu Yao , Xueyang Wu , and Kai Yu
                                        In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
                                      19. On training bi-directional neural network language model with noise contrastive estimation
                                        Tianxing He , Yu Zhang , Jasha Droppo , and Kai Yu
                                        In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
                                      20. Rich punctuations prediction using large-scale deep learning
                                        Xueyang Wu , Su Zhu , Yue Wu , and Kai Yu
                                        In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
                                      21. Directed automatic speech transcription error correction using bidirectional LSTM
                                        Da Zheng , Zhehuai Chen , Yue Wu , and Kai Yu
                                        In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
                                      22. The splab at the NTCIR-12 Short Text Conversation Task
                                        Ke Wu , Xuan Liu , and Kai Yu
                                        In Proceedings of the 12th NTCIR Conference on Evaluation of Information Access Technologies, National Center of Sciences, Tokyo, Japan, June 7-10, 2016 , Oct 2016

                                      2015

                                      1. Deep feature for text-dependent speaker verification
                                        Yuan Liu , Yanmin Qian , Nanxin Chen , Tianfan Fu , Ya Zhang , and Kai Yu
                                        Speech Commun., Oct 2015
                                      2. Multi-task joint-learning of deep neural networks for robust speech recognition
                                        Yanmin Qian , Maofan Yin , Yongbin You , and Kai Yu
                                        In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
                                      3. Cambridge university transcription systems for the multi-genre broadcast challenge
                                        Philip C. Woodland , Xunying Liu , Yanmin Qian , Chao Zhang , Mark J. F. Gales , Penny Karanasou , Pierre Lanchantin , and Linlin Wang
                                        In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
                                      4. The development of the cambridge university alignment systems for the multi-genre broadcast challenge
                                        Pierre Lanchantin , Mark J. F. Gales , Penny Karanasou , Xunying Liu , Yanmin Qian , Linlin Wang , Philip C. Woodland , and Chao Zhang
                                        In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
                                      5. Speaker diarisation and longitudinal linking in multi-genre broadcast data
                                        Penny Karanasou , Mark J. F. Gales , Pierre Lanchantin , Xunying Liu , Yanmin Qian , Linlin Wang , Philip C. Woodland , and Chao Zhang
                                        In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
                                      6. Local trajectory based speech enhancement for robust speech recognition with deep neural network
                                        Yongbin You , Yanmin Qian , and Kai Yu
                                        In IEEE China Summit and International Conference on Signal and Information Processing, ChinaSIP 2015, Chengdu, China, July 12-15, 2015 , Oct 2015
                                      7. An investigation on DNN-derived bottleneck features for GMM-HMM based robust speech recognition
                                        Yongbin You , Yanmin Qian , Tianxing He , and Kai Yu
                                        In IEEE China Summit and International Conference on Signal and Information Processing, ChinaSIP 2015, Chengdu, China, July 12-15, 2015 , Oct 2015
                                      8. Cluster adaptive training for deep neural network
                                        Tian Tan , Yanmin Qian , Maofan Yin , Yimeng Zhuang , and Kai Yu
                                        In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
                                      9. A novel static parameter calculation method for model compensation
                                        Suliang Bu , Yunxin Zhao , Yanmin Qian , and Kai Yu
                                        In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
                                      10. Recurrent neural network language model with structured word embeddings for speech recognition
                                        Tianxing He , Xu Xiang , Yanmin Qian , and Kai Yu
                                        In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
                                      11. Automatic model redundancy reduction for fast back-propagation for deep neural networks in speech recognition
                                        Yanmin Qian , Tianxing He , Wei Deng , and Kai Yu
                                        In 2015 International Joint Conference on Neural Networks, IJCNN 2015, Killarney, Ireland, July 12-17, 2015 , Oct 2015
                                      12. Multi-task learning for text-dependent speaker verification
                                        Nanxin Chen , Yanmin Qian , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      13. Robust deep feature for spoofing detection - the SJTU system for ASVspoof 2015 challenge
                                        Nanxin Chen , Yanmin Qian , Heinrich Dinkel , Bo Chen , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      14. Very deep convolutional neural networks for LVCSR
                                        Mengxiao Bi , Yanmin Qian , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      15. Paragraph vector based topic model for language model adaptation
                                        Wengong Jin , Tianxing He , Yanmin Qian , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      16. Constrained Markov Bayesian Polynomial for Efficient Dialogue State Tracking
                                        Kai Yu, Kai Sun , Lu Chen , and Su Zhu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2015
                                      17. An investigation of context clustering for statistical speech synthesis with deep neural network
                                        Bo Chen , Zhehuai Chen , Jiachen Xu , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      18. Recurrent Polynomial Network for Dialogue State Tracking with Mismatched Semantic Parsers
                                        Qizhe Xie , Kai Sun , Su Zhu , Lu Chen, and Kai Yu
                                        In Proceedings of the SIGDIAL 2015 Conference, The 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 2-4 September 2015, Prague, Czech Republic , Oct 2015
                                      19. Hyper-parameter Optimisation of Gaussian Process Reinforcement Learning for Statistical Dialogue Management
                                        Lu Chen, Pei-Hao Su , and Milica Gasic
                                        In Proceedings of the SIGDIAL 2015 Conference, The 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 2-4 September 2015, Prague, Czech Republic , Oct 2015

                                      2014

                                      1. Stochastic data sweeping for fast DNN training
                                        Wei Deng , Yanmin Qian , Yuchen Fan , Tianfan Fu , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
                                      2. Reshaping deep neural network for fast decoding by node-pruning
                                        Tianxing He , Yuchen Fan , Yanmin Qian , Tian Tan , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
                                      3. Second order vector taylor series based robust speech recognition
                                        Suliang Bu , Yanmin Qian , Khe Chai Sim , Yongbin You , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
                                      4. Speaker verification with deep features
                                        Yuan Liu , Tianfan Fu , Yuchen Fan , Yanmin Qian , and Kai Yu
                                        In 2014 International Joint Conference on Neural Networks, IJCNN 2014, Beijing, China, July 6-11, 2014 , Oct 2014
                                      5. Tandem deep features for text-dependent speaker verification
                                        Tianfan Fu , Yanmin Qian , Yuan Liu , and Kai Yu
                                        In INTERSPEECH 2014, 15th Annual Conference of the International Speech Communication Association, Singapore, September 14-18, 2014 , Oct 2014
                                      6. A novel dynamic parameters calculation approach for model compensation
                                        Suliang Bu , Yanmin Qian , and Kai Yu
                                        In INTERSPEECH 2014, 15th Annual Conference of the International Speech Communication Association, Singapore, September 14-18, 2014 , Oct 2014
                                      7. Acoustic emotion recognition using deep neural network
                                        Jianwei Niu , Yanmin Qian , and Kai Yu
                                        In The 9th International Symposium on Chinese Spoken Language Processing, Singapore, September 12-14, 2014 , Oct 2014
                                      8. The SJTU System for Dialog State Tracking Challenge 2
                                        Kai Sun , Lu Chen , Su Zhu , and Kai Yu
                                        In Proceedings of the SIGDIAL 2014 Conference, The 15th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 18-20 June 2014, Philadelphia, PA, USA , Oct 2014
                                      9. A generalized rule based tracker for dialogue state tracking
                                        Kai Sun , Lu Chen , Su Zhu , and Kai Yu
                                        In 2014 IEEE Spoken Language Technology Workshop, SLT 2014, South Lake Tahoe, NV, USA, December 7-10, 2014 , Oct 2014
                                      10. Semantic parser enhancement for dialogue domain extension with little data
                                        Su Zhu , Lu Chen, Kai Sun , Da Zheng , and Kai Yu
                                        In 2014 IEEE Spoken Language Technology Workshop, SLT 2014, South Lake Tahoe, NV, USA, December 7-10, 2014 , Oct 2014

                                      2013

                                      1. Combination of data borrowing strategies for low-resource LVCSR
                                        Yanmin Qian , Kai Yu, and Jia Liu
                                        In 2013 IEEE Workshop on Automatic Speech Recognition and Understanding, Olomouc, Czech Republic, December 8-12, 2013 , Oct 2013
                                      2. MLP-HMM two-stage unsupervised training for low-resource languages on conversational telephone speech recognition
                                        Yanmin Qian and Jia Liu
                                        In INTERSPEECH 2013, 14th Annual Conference of the International Speech Communication Association, Lyon, France, August 25-29, 2013 , Oct 2013
                                      3. A New Word Language Model Evaluation Metric for Character Based Languages
                                        Peilu Wang , Ruihua Sun , Hai Zhao , and Kai Yu
                                        In Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data - 12th China National Conference, CCL 2013 and First International Symposium, NLP-NABD 2013, Suzhou, China, October 10-12, 2013. Proceedings , Oct 2013

                                      2012

                                      1. Introduction to the Issue on Advances in Spoken Dialogue Systems and Mobile Interface
                                        Jason D. Williams , Kai Yu, Brahim Chaib-draa , Oliver Lemon , Roberto Pieraccini , Olivier Pietquin , Pascal Poupart , and Steve J. Young
                                        IEEE J. Sel. Top. Signal Process., Oct 2012
                                      2. ICMI’12 grand challenge: haptic voice recognition
                                        Khe Chai Sim , Shengdong Zhao , Kai Yu, and Hank Liao
                                        In International Conference on Multimodal Interaction, ICMI ’12, Santa Monica, CA, USA, October 22-26, 2012 , Oct 2012
                                      3. Development of the 2012 SJTU HVR system
                                        Hainan Xu , Yuchen Fan , and Kai Yu
                                        In International Conference on Multimodal Interaction, ICMI ’12, Santa Monica, CA, USA, October 22-26, 2012 , Oct 2012
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + 📃论文 | X - LANCE

                                      📃论文

                                      论文按时间倒序列出。

                                      2024

                                      1. Advanced Long-Content Speech Recognition With Factorized Neural Transducer
                                        Xun Gong , Yu Wu , Jinyu Li , Shujie Liu , Rui Zhao , Xie Chen, and Yanmin Qian
                                        IEEE ACM Trans. Audio Speech Lang. Process., 2024
                                      2. EAT: Self-Supervised Pre-Training with Efficient Audio Transformer
                                        Wenxi Chen , Yuzhe Liang , Ziyang Ma , Zhisheng Zheng , and Xie Chen
                                        CoRR, 2024
                                      3. ELLA-V: Stable Neural Codec Language Modeling with Alignment-guided Sequence Reordering
                                        Yakun Song , Zhuo Chen , Xiaofei Wang , Ziyang Ma , and Xie Chen
                                        CoRR, 2024
                                      4. BAT: Learning to Reason about Spatial Sounds with Large Language Models
                                        Zhisheng Zheng , Puyuan Peng , Ziyang Ma , Xie Chen, Eunsol Choi , and David Harwath
                                        CoRR, 2024
                                      5. An Embarrassingly Simple Approach for LLM with Strong ASR Capacity
                                        Ziyang Ma , Guanrou Yang , Yifan Yang , Zhifu Gao , Jiaming Wang , Zhihao Du , Fan Yu , Qian Chen , Siqi Zheng , Shiliang Zhang , and Xie Chen
                                        CoRR, 2024
                                      6. Beyond the Status Quo: A Contemporary Survey of Advances and Challenges in Audio Captioning
                                        Xuenan Xu , Zeyu Xie , Mengyue Wu, and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., 2024
                                      7. Towards Weakly Supervised Text-to-Audio Grounding
                                        Xuenan Xu , Ziyang Ma , Mengyue Wu, and Kai Yu
                                        CoRR, 2024
                                      8. VALL-T: Decoder-Only Generative Transducer for Robust and Decoding-Controllable Text-to-Speech
                                        Chenpeng Du , Yiwei Guo , Hankun Wang , Yifan Yang , Zhikang Niu , Shuai Wang , Hui Zhang , Xie Chen, and Kai Yu
                                        CoRR, 2024
                                      9. ChemDFM: Dialogue Foundation Model for Chemistry
                                        Zihan Zhao , Da Ma , Lu Chen, Liangtai Sun , Zihao Li , Hongshen Xu , Zichen Zhu , Su Zhu , Shuai Fan , Guodong Shen , Xin Chen , and Kai Yu
                                        CoRR, 2024
                                      10. MULTI: Multimodal Understanding Leaderboard with Text and Images
                                        Zichen Zhu, Yang Xu , Lu Chen, Jingkai Yang , Yichuan Ma , Yiming Sun , Hailin Wen , Jiaqi Liu , Jinyu Cai , Yingzi Ma , Situo Zhang , Zihan Zhao , Liangtai Sun , and Kai Yu
                                        CoRR, 2024

                                      2023

                                      1. A Unified Framework From Face Image Restoration to Data Augmentation Using Generative Prior
                                        Jiawei You , Ganyu Huang , Tianyuan Han , Haoze Yang , and Liping Shen
                                        IEEE Access, 2023
                                      2. Human Pose Estimation with Combined Feature Maps and Joint Embeddings
                                        Tianyuan Han , Ganyu Huang , Chunhui Li , and Liping Shen
                                        In Proceedings of the 2023 International Conference on Advances in Artificial Intelligence and Applications, AAIA 2023, Wuhan, China, November 18-20, 2023 , 2023
                                      3. Assessing and Enhancing LLMs: A Physics and History Dataset and One-More-Check Pipeline Method
                                        Chaofan He , Chunhui Li , Tianyuan Han , and Liping Shen
                                        In Neural Information Processing - 30th International Conference, ICONIP 2023, Changsha, China, November 20-23, 2023, Proceedings, Part XIII , 2023
                                      4. GAN Latent Space Manipulation Based Augmentation for Unbalanced Emotion Datasets
                                        Yuhan Xiong , Jiawei You , and Liping Shen
                                        In International Joint Conference on Neural Networks, IJCNN 2023, Gold Coast, Australia, June 18-23, 2023 , 2023
                                      5. LongFNT: Long-Form Speech Recognition with Factorized Neural Transducer
                                        Xun Gong , Yu Wu , Jinyu Li , Shujie Liu , Rui Zhao , Xie Chen, and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      6. Factorized AED: Factorized Attention-Based Encoder-Decoder for Text-Only Domain Adaptive ASR
                                        Xun Gong , Wei Wang , Hang Shao , Xie Chen, and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      7. Exploring Binary Classification Loss for Speaker Verification
                                        Bing Han , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      8. Improving Dino-Based Self-Supervised Speaker Verification with Progressive Cluster-Aware Training
                                        Bing Han , Wen Huang , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      9. Robust Audio-Visual ASR with Unified Cross-Modal Attention
                                        Jiahong Li , Chenda Li , Yifei Wu , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      10. Target Sound Extraction with Variable Cross-Modality Clues
                                        Chenda Li , Yao Qian , Zhuo Chen , Dongmei Wang , Takuya Yoshioka , Shujie Liu , Yanmin Qian , and Michael Zeng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      11. Predictive Skim: Contrastive Predictive Coding for Low-Latency Online Speech Separation
                                        Chenda Li , Yifei Wu , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      12. Multi-Speaker End-to-End Multi-Modal Speaker Diarization System for the MISP 2022 Challenge
                                        Tao Liu , Zhengyang Chen , Yanmin Qian , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      13. Joint Discriminator and Transfer Based Fast Domain Adaptation For End-To-End Speech Recognition
                                        Hang Shao , Tian Tan , Wei Wang , Xun Gong , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      14. Lowbit Neural Network Quantization for Speaker Verification
                                        Haoyu Wang , Bei Liu , Yifei Wu , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      15. Wespeaker: A Research and Production Oriented Speaker Embedding Learning Toolkit
                                        Hongji Wang , Chengdong Liang , Shuai Wang , Zhengyang Chen , Binbin Zhang , Xu Xiang , Yanlei Deng , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      16. HuBERT-AGG: Aggregated Representation Distillation of Hidden-Unit Bert for Robust Speech Recognition
                                        Wei Wang and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      17. Light-Weight Visualvoice: Neural Network Quantization On Audio Visual Speech Separation
                                        Yifei Wu , Chenda Li , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      18. Code-Switching Text Generation and Injection in Mandarin-English ASR
                                        Haibin Yu , Yuxuan Hu , Yao Qian , Ma Jin , Linquan Liu , Shujie Liu , Yu Shi , Yanmin Qian , Edward Lin , and Michael Zeng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      19. Adaptive Large Margin Fine-Tuning For Robust Speaker Verification
                                        Leying Zhang , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , 2023
                                      20. ComSL: A Composite Speech-Language Model for End-to-End Speech-to-Text Translation
                                        Chenyang Le , Yao Qian , Long Zhou , Shujie Liu , Yanmin Qian , Michael Zeng , and Xuedong Huang
                                        In Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023 , 2023
                                      21. Exploring the Integration of Speech Separation and Recognition with Self-Supervised Learning Representation
                                        Yoshiki Masuyama , Xuankai Chang , Wangyou Zhang , Samuele Cornell , Zhong-Qiu Wang , Nobutaka Ono , Yanmin Qian , and Shinji Watanabe
                                        In IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2023, New Paltz, NY, USA, October 22-25, 2023 , 2023
                                      22. Software Design and User Interface of ESPnet-SE++: Speech Enhancement for Robust Speech Processing (espnet-v.202310) (Version 1)
                                        Yen-Ju Lu , Xuankai Chang , Chenda Li , Wangyou Zhang , Samuele Cornell , Zhaoheng Ni , Yoshiki Masuyama , Brian Yan , Robin Scheibler , Zhong-Qiu Wang , Yu Tsao , Yanmin Qian , and Shinji Watanabe
                                        Oct 2023
                                        Accessed on YYYY-MM-DD.
                                      23. Self-Supervised Learning with Cluster-Aware-DINO for High-Performance Robust Speaker Verification
                                        Bing Han , Zhengyang Chen , and Yanmin Qian
                                        CoRR, Oct 2023
                                      24. Attention-based Encoder-Decoder Network for End-to-End Neural Speaker Diarization with Target Speaker Attractor
                                        Zhengyang Chen , Bing Han , Shuai Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      25. Whisper-KDQ: A Lightweight Whisper via Guided Knowledge Distillation and Quantization for Efficient ASR
                                        Hang Shao , Wei Wang , Bei Liu , Xun Gong , Haoyu Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      26. Weakly-Supervised Speech Pre-training: A Case Study on Target Speech Recognition
                                        Wangyou Zhang and Yanmin Qian
                                        CoRR, Oct 2023
                                      27. Adapting Multi-Lingual ASR Models for Handling Multiple Talkers
                                        Chenda Li , Yao Qian , Zhuo Chen , Naoyuki Kanda , Dongmei Wang , Takuya Yoshioka , Yanmin Qian , and Michael Zeng
                                        CoRR, Oct 2023
                                      28. InstructME: An Instruction Guided Music Edit And Remix Framework with Latent Diffusion Models
                                        Bing Han , Junyu Dai , Xuchen Song , Weituo Hao , Xinyan He , Dong Guo , Jitong Chen , Yuxuan Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      29. Attention-based Encoder-Decoder End-to-End Neural Diarization with Embedding Enhancer
                                        Zhengyang Chen , Bing Han , Shuai Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      30. USED: Universal Speaker Extraction and Diarization
                                        Junyi Ao , Mehmet Sinan Yildirim , Meng Ge , Shuai Wang , Ruijie Tao , Yanmin Qian , Liqun Deng , Longshuai Xiao , and Haizhou Li
                                        CoRR, Oct 2023
                                      31. Leveraging In-the-Wild Data for Effective Self-Supervised Pretraining in Speaker Recognition
                                        Shuai Wang , Qibing Bai , Qi Liu , Jianwei Yu , Zhengyang Chen , Bing Han , Yanmin Qian , and Haizhou Li
                                        CoRR, Oct 2023
                                      32. The second multi-channel multi-party meeting transcription challenge (M2MeT 2.0): A benchmark for speaker-attributed ASR
                                        Yuhao Liang , Mohan Shi , Fan Yu , Yangze Li , Shiliang Zhang , Zhihao Du , Qian Chen , Lei Xie , Yanmin Qian , Jian Wu , Zhuo Chen , Kong Aik Lee , Zhijie Yan , and Hui Bu
                                        CoRR, Oct 2023
                                      33. Diffusion Conditional Expectation Model for Efficient and Robust Target Speech Extraction
                                        Leying Zhang , Yao Qian , Linfeng Yu , Heming Wang , Xinkai Wang , Hemin Yang , Long Zhou , Shujie Liu , Yanmin Qian , and Michael Zeng
                                        CoRR, Oct 2023
                                      34. Toward Universal Speech Enhancement for Diverse Input Conditions
                                        Wangyou Zhang , Kohei Saijo , Zhong-Qiu Wang , Shinji Watanabe , and Yanmin Qian
                                        CoRR, Oct 2023
                                      35. One-Shot Sensitivity-Aware Mixed Sparsity Pruning for Large Language Models
                                        Hang Shao , Bei Liu , and Yanmin Qian
                                        CoRR, Oct 2023
                                      36. FAT-HuBERT: Front-end Adaptive Training of Hidden-unit BERT for Distortion-Invariant Robust Speech Recognition
                                        Dongning Yang , Wei Wang , and Yanmin Qian
                                        CoRR, Oct 2023
                                      37. Speaker Adaptive Text-to-Speech With Timbre-Normalized Vector-Quantized Feature
                                        Chenpeng Du , Yiwei Guo , Xie Chen, and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2023
                                      38. Fast-Hubert: an Efficient Training Framework for Self-Supervised Speech Representation Learning
                                        Guanrou Yang , Ziyang Ma , Zhisheng Zheng , Yakun Song , Zhikang Niu , and Xie Chen
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2023, Taipei, Taiwan, December 16-20, 2023 , Oct 2023
                                      39. Improving Few-Shot Learning for Talking Face System with TTS Data Augmentation
                                        Qi Chen , Ziyang Ma , Tao Liu , Xu Tan , Qu Lu , Kai Yu , and Xie Chen
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      40. Front-End Adapter: Adapting Front-End Input of Speech Based Self-Supervised Learning for Speech Recognition
                                        Xie Chen, Ziyang Ma , Changli Tang , Yujin Wang , and Zhisheng Zheng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      41. Emodiff: Intensity Controllable Emotional Text-to-Speech with Soft-Label Guidance
                                        Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      42. DAE-Talker: High Fidelity Speech-Driven Talking Face Generation with Diffusion Autoencoder
                                        Chenpeng Du , Qi Chen , Tianyu He , Xu Tan , Xie Chen, Kai Yu, Sheng Zhao , and Jiang Bian
                                        In Proceedings of the 31st ACM International Conference on Multimedia, MM 2023, Ottawa, ON, Canada, 29 October 2023 - 3 November 2023 , Oct 2023
                                      43. Blank-regularized CTC for Frame Skipping in Neural Transducer
                                        Yifan Yang , Xiaoyu Yang , Liyong Guo , Zengwei Yao , Wei Kang , Fangjun Kuang , Long Lin , Xie Chen, and Daniel Povey
                                        CoRR, Oct 2023
                                      44. UniCATS: A Unified Context-Aware Text-to-Speech Framework with Contextual VQ-Diffusion and Vocoding
                                        Chenpeng Du , Yiwei Guo , Feiyu Shen , Zhijun Liu , Zheng Liang , Xie Chen, Shuai Wang , Hui Zhang , and Kai Yu
                                        CoRR, Oct 2023
                                      45. Improving Code-Switching and Named Entity Recognition in ASR with Speech Editing based Data Augmentation
                                        Zheng Liang , Zheshu Song , Ziyang Ma , Chenpeng Du , Kai Yu , and Xie Chen
                                        CoRR, Oct 2023
                                      46. Pushing the Limits of Unsupervised Unit Discovery for SSL Speech Representation
                                        Ziyang Ma , Zhisheng Zheng , Guanrou Yang , Yu Wang , Chao Zhang , and Xie Chen
                                        CoRR, Oct 2023
                                      47. Towards Effective and Compact Contextual Representation for Conformer Transducer Speech Recognition Systems
                                        Mingyu Cui , Jiawen Kang , Jiajun Deng , Xi Yin , Yutao Xie , Xie Chen, and Xunying Liu
                                        CoRR, Oct 2023
                                      48. DSE-TTS: Dual Speaker Embedding for Cross-Lingual Text-to-Speech
                                        Sen Liu , Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      49. Unsupervised Active Learning: Optimizing Labeling Cost-Effectiveness for Automatic Speech Recognition
                                        Zhisheng Zheng , Ziyang Ma , Yu Wang , and Xie Chen
                                        CoRR, Oct 2023
                                      50. VoiceFlow: Efficient Text-to-Speech with Rectified Flow Matching
                                        Yiwei Guo , Chenpeng Du , Ziyang Ma , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      51. Towards Universal Speech Discrete Tokens: A Case Study for ASR and TTS
                                        Yifan Yang , Feiyu Shen , Chenpeng Du , Ziyang Ma , Kai Yu, Daniel Povey , and Xie Chen
                                        CoRR, Oct 2023
                                      52. Incorporating Class-based Language Model for Named Entity Recognition in Factorized Neural Transducer
                                        Peng Wang , Yifan Yang , Zheng Liang , Tian Tan , Shiliang Zhang , and Xie Chen
                                        CoRR, Oct 2023
                                      53. Improved Factorized Neural Transducer Model For text-only Domain Adaptation
                                        Junzhe Liu , Jianwei Yu , and Xie Chen
                                        CoRR, Oct 2023
                                      54. Leveraging Speech PTM, Text LLM, and Emotional TTS for Speech Emotion Recognition
                                        Ziyang Ma , Wen Wu , Zhisheng Zheng , Yiwei Guo , Qian Chen , Shiliang Zhang , and Xie Chen
                                        CoRR, Oct 2023
                                      55. Acoustic BPE for Speech Generation with Discrete Tokens
                                        Feiyu Shen , Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      56. Expressive TTS Driven by Natural Language Prompts Using Few Human Annotations
                                        Hanglei Zhang , Yiwei Guo , Sen Liu , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      57. emotion2vec: Self-Supervised Pre-Training for Speech Emotion Representation
                                        Ziyang Ma , Zhisheng Zheng , Jiaxin Ye , Jinchao Li , Zhifu Gao , Shiliang Zhang , and Xie Chen
                                        CoRR, Oct 2023
                                      58. OPAL: Ontology-Aware Pretrained Language Model for End-to-End Task-Oriented Dialogue
                                        Zhi Chen , Yuncong Liu , Lu Chen , Su Zhu , Mengyue Wu, and Kai Yu
                                        Trans. Assoc. Comput. Linguistics, Oct 2023
                                      59. Transcribing Vocal Communications of Domestic Shiba Inu Dogs
                                        Jieyi Huang , Chunhao Zhang , Mengyue Wu , and Kenny Q. Zhu
                                        In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      60. Detection of Multiple Mental Disorders from Social Media with Two-Stream Psychiatric Experts
                                        Siyuan Chen , Zhiling Zhang , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
                                      61. Semantic Space Grounded Weighted Decoding for Multi-Attribute Controllable Dialogue Generation
                                        Zhiling Zhang , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
                                      62. Diverse and Vivid Sound Generation from Text Descriptions
                                        Guangwei Li , Xuenan Xu , Lingfeng Dai , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      63. Investigating Pooling Strategies and Loss Functions for Weakly-Supervised Text-to-Audio Grounding via Contrastive Learning
                                        Xuenan Xu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2023 - Workshops, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      64. BLAT: Bootstrapping Language-Audio Pre-training based on AudioSet Tag-guided Synthetic Data
                                        Xuenan Xu , Zhiling Zhang , Zelin Zhou , Pingyue Zhang , Zeyu Xie , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the 31st ACM International Conference on Multimedia, MM 2023, Ottawa, ON, Canada, 29 October 2023 - 3 November 2023 , Oct 2023
                                      65. LLM-empowered Chatbots for Psychiatrist and Patient Simulation: Application and Evaluation
                                        Siyuan Chen , Mengyue Wu , Kenny Q. Zhu , Kunyao Lan , Zhiling Zhang , and Lyuchun Cui
                                        CoRR, Oct 2023
                                      66. Enhance Temporal Relations in Audio Captioning with Sound Event Detection
                                        Zeyu Xie , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2023
                                      67. Improving Audio Caption Fluency with Automatic Error Correction
                                        Hanxue Zhang , Zeyu Xie , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2023
                                      68. A Large-scale Dataset for Audio-Language Representation Learning
                                        Luoyi Sun , Xuenan Xu , Mengyue Wu, and Weidi Xie
                                        CoRR, Oct 2023
                                      69. Does My Dog "Speak" Like Me? The Acoustic Correlation between Pet Dogs and Their Human Owners
                                        Jieyi Huang , Chunhao Zhang , Yufei Wang , Mengyue Wu , and Kenny Q. Zhu
                                        CoRR, Oct 2023
                                      70. Towards Lexical Analysis of Dog Vocalizations via Online Videos
                                        Yufei Wang , Chunhao Zhang , Jieyi Huang , Mengyue Wu , and Kenny Q. Zhu
                                        CoRR, Oct 2023
                                      71. PsyEval: A Comprehensive Large Language Model Evaluation Benchmark for Mental Health
                                        Haoan Jin , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
                                        CoRR, Oct 2023
                                      72. A Heterogeneous Graph to Abstract Syntax Tree Framework for Text-to-SQL
                                        Ruisheng Cao , Lu Chen, Jieyu Li , Hanchong Zhang , Hongshen Xu , Wangyou Zhang , and Kai Yu
                                        IEEE Trans. Pattern Anal. Mach. Intell., Oct 2023
                                      73. Speech Enhancement With Integration of Neural Homomorphic Synthesis and Spectral Masking
                                        Wenbin Jiang and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2023
                                      74. SPM: A Split-Parsing Method for Joint Multi-Intent Detection and Slot Filling
                                        Sheng Jiang , Su Zhu , Ruisheng Cao , Qingliang Miao , and Kai Yu
                                        In Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics: Industry Track, ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      75. Exploring Schema Generalizability of Text-to-SQL
                                        Jieyu Li , Lu Chen, Ruisheng Cao , Su Zhu , Hongshen Xu , Zhi Chen , Hanchong Zhang , and Kai Yu
                                        In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      76. TeCS: A Dataset and Benchmark for Tense Consistency of Machine Translation
                                        Yiming Ai , Zhiwei He , Kai Yu, and Rui Wang
                                        In Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      77. CSS: A Large-scale Cross-schema Chinese Text-to-SQL Medical Dataset
                                        Hanchong Zhang , Jieyu Li , Lu Chen, Ruisheng Cao , Yunyan Zhang , Yu Huang , Yefeng Zheng , and Kai Yu
                                        In Findings of the Association for Computational Linguistics: ACL 2023, Toronto, Canada, July 9-14, 2023 , Oct 2023
                                      78. ACT-SQL: In-Context Learning for Text-to-SQL with Automatically-Generated Chain-of-Thought
                                        Hanchong Zhang , Ruisheng Cao , Lu Chen, Hongshen Xu , and Kai Yu
                                        In Findings of the Association for Computational Linguistics: EMNLP 2023, Singapore, December 6-10, 2023 , Oct 2023
                                      79. Multi-Speaker Multi-Lingual VQTTS System for LIMMITS 2023 Challenge
                                        Chenpeng Du , Yiwei Guo , Feiyu Shen , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      80. DiffVoice: Text-to-Speech with Latent Diffusion
                                        Zhijun Liu , Yiwei Guo , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing ICASSP 2023, Rhodes Island, Greece, June 4-10, 2023 , Oct 2023
                                      81. Large Language Models Are Semi-Parametric Reinforcement Learning Agents
                                        Danyang Zhang , Lu Chen, Situo Zhang , Hongshen Xu , Zihan Zhao , and Kai Yu
                                        In Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023 , Oct 2023
                                      82. Mobile-Env: A Universal Platform for Training and Evaluation of Mobile Interaction
                                        Danyang Zhang , Lu Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      83. SciEval: A Multi-Level Large Language Model Evaluation Benchmark for Scientific Research
                                        Liangtai Sun , Yang Han , Zihan Zhao , Da Ma , Zhennan Shen , Baocai Chen , Lu Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      84. ASTormer: An AST Structure-aware Transformer Decoder for Text-to-SQL
                                        Ruisheng Cao , Hanchong Zhang , Hongshen Xu , Jieyu Li , Da Ma , Lu Chen, and Kai Yu
                                        CoRR, Oct 2023
                                      85. DiffDub: Person-generic Visual Dubbing Using Inpainting Renderer with Diffusion Auto-encoder
                                        Tao Liu , Chenpeng Du , Shuai Fan , Feilong Chen , and Kai Yu
                                        CoRR, Oct 2023
                                      86. SEF-VC: Speaker Embedding Free Zero-Shot Voice Conversion with Cross Attention
                                        Junjie Li , Yiwei Guo , Xie Chen, and Kai Yu
                                        CoRR, Oct 2023

                                      2022

                                      1. Heterogeneous Graph Representation for Knowledge Tracing
                                        Jisen Chen , Jian Shen , Ting Long , Liping Shen, Weinan Zhang , and Yong Yu
                                        In Neural Information Processing - 29th International Conference, ICONIP 2022, Virtual Event, November 22-26, 2022, Proceedings, Part I , Oct 2022
                                      2. A simple but practical method: How to improve the usage of entities in the Chinese question generation
                                        Haoze Yang , Kunyao Lan , Jiawei You , and Liping Shen
                                        In International Joint Conference on Neural Networks, IJCNN 2022, Padua, Italy, July 18-23, 2022 , Oct 2022
                                      3. From Uniform Models To Generic Representations: Stock Return Prediction With Pre-training
                                        Jiawei You , Tianyuan Han , and Liping Shen
                                        In International Joint Conference on Neural Networks, IJCNN 2022, Padua, Italy, July 18-23, 2022 , Oct 2022
                                      4. WavLM: Large-Scale Self-Supervised Pre-Training for Full Stack Speech Processing
                                        Sanyuan Chen , Chengyi Wang , Zhengyang Chen , Yu Wu , Shujie Liu , Zhuo Chen , Jinyu Li , Naoyuki Kanda , Takuya Yoshioka , Xiong Xiao , Jian Wu , Long Zhou , Shuo Ren , Yanmin Qian , Yao Qian , Jian Wu , Michael Zeng , Xiangzhan Yu , and Furu Wei
                                        IEEE J. Sel. Top. Signal Process., Oct 2022
                                      5. Optimizing Data Usage for Low-Resource Speech Recognition
                                        Yanmin Qian , and Zhikai Zhou
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      6. Dual-Path Modeling With Memory Embedding Model for Continuous Speech Separation
                                        Chenda Li , Zhuo Chen , and Yanmin Qian
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      7. Layer-Wise Fast Adaptation for End-to-End Multi-Accent Speech Recognition
                                        Yanmin Qian , Xun Gong , and Houjun Huang
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      8. End-to-End Dereverberation, Beamforming, and Speech Recognition in a Cocktail Party
                                        Wangyou Zhang , Xuankai Chang , Christoph Böddeker , Tomohiro Nakatani , Shinji Watanabe , and Yanmin Qian
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      9. Time-Domain Audio-Visual Speech Separation on Low Quality Videos
                                        Yifei Wu , Chenda Li , Jinfeng Bai , Zhongqin Wu , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      10. SkiM: Skipping Memory LSTM for Low-Latency Real-Time Continuous Speech Separation
                                        Chenda Li , Lei Yang , Weiqin Wang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      11. Large-Scale Self-Supervised Speech Representation Learning for Automatic Speaker Verification
                                        Zhengyang Chen , Sanyuan Chen , Yu Wu , Yao Qian , Chengyi Wang , Shujie Liu , Yanmin Qian , and Michael Zeng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      12. Local Information Modeling with Self-Attention for Speaker Verification
                                        Bing Han , Zhengyang Chen , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      13. Punctuation Prediction for Streaming On-Device Speech Recognition
                                        Zhikai Zhou , Tian Tan , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      14. MLP-SVNET: A Multi-Layer Perceptrons Based Network for Speaker Verification
                                        Bing Han , Zhengyang Chen , Bei Liu , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      15. Self-Knowledge Distillation via Feature Enhancement for Speaker Verification
                                        Bei Liu , Haoyu Wang , Zhengyang Chen , Shuai Wang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      16. Optimizing Alignment of Speech and Language Latent Spaces for End-To-End Speech Recognition and Understanding
                                        Wei Wang , Shuo Ren , Yao Qian , Shujie Liu , Yu Shi , Yanmin Qian , and Michael Zeng
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      17. Exploring Effective Data Utilization for Low-Resource Speech Recognition
                                        Zhikai Zhou , Wei Wang , Wangyou Zhang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      18. Summary on the ICASSP 2022 Multi-Channel Multi-Party Meeting Transcription Grand Challenge
                                        Fan Yu , Shiliang Zhang , Pengcheng Guo , Yihui Fu , Zhihao Du , Siqi Zheng , Weilong Huang , Lei Xie , Zheng-Hua Tan , DeLiang Wang , Yanmin Qian , Kong Aik Lee , Zhijie Yan , Bin Ma , Xin Xu , and Hui Bu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      19. The SJTU System For Multimodal Information Based Speech Processing Challenge 2021
                                        Wei Wang , Xun Gong , Yifei Wu , Zhikai Zhou , Chenda Li , Wangyou Zhang , Bing Han , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      20. Attentive Feature Fusion for Robust Speaker Verification
                                        Bei Liu , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      21. Dual Path Embedding Learning for Speaker Verification with Triplet Attention
                                        Bei Liu , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      22. DF-ResNet: Boosting Speaker Verification Performance with Depth-First Design
                                        Bei Liu , Zhengyang Chen , Shuai Wang , Haoyu Wang , Bing Han , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      23. Enroll-Aware Attentive Statistics Pooling for Target Speaker Verification
                                        Leying Zhang , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      24. MSDWild: Multi-modal Speaker Diarization Dataset in the Wild
                                        Tao Liu , Shuai Fan , Xu Xiang , Hongbo Song , Shaoxiong Lin , Jiaqi Sun , Tianyuan Han , Siyuan Chen , Binwei Yao , Sen Liu , Yifei Wu , Yanmin Qian , and Kai Yu
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      25. Knowledge Transfer and Distillation from Autoregressive to Non-Autoregressive Speech Recognition
                                        Xun Gong , Zhikai Zhou , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      26. Self-Supervised Speaker Verification Using Dynamic Loss-Gate and Label Correction
                                        Bing Han , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      27. Separating Long-Form Speech with Group-wise Permutation Invariant Training
                                        Wangyou Zhang , Zhuo Chen , Naoyuki Kanda , Shujie Liu , Jinyu Li , Sefik Emre Eskimez , Takuya Yoshioka , Xiong Xiao , Zhong Meng , Yanmin Qian , and Furu Wei
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      28. ESPnet-SE++: Speech Enhancement for Robust Speech Recognition, Translation, and Understanding
                                        Yen-Ju Lu , Xuankai Chang , Chenda Li , Wangyou Zhang , Samuele Cornell , Zhaoheng Ni , Yoshiki Masuyama , Brian Yan , Robin Scheibler , Zhong-Qiu Wang , Yu Tsao , Yanmin Qian , and Shinji Watanabe
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      29. Improving Speech Separation with Knowledge Distilled from Self-supervised Pre-trained Models
                                        Bowen Qu , Chenda Li , Jinfeng Bai , and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      30. Text-Informed Knowledge Distillation for Robust Speech Enhancement and Recognition
                                        Wei Wang , Wangyou Zhang , Shaoxiong Lin , and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      31. Medical Difficult Airway Detection using Speech Technology
                                        Zhikai Zhou , Shuang Cao , Zhengyang Chen , Bei Liu , Ming Xia , Hong Jiang , and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      32. Speaking style compensation on synthetic audio for robust keyword spotting
                                        Houjun Huang , and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      33. The Conversational Short-phrase Speaker Diarization (CSSD) Task: Dataset, Evaluation Metric and Baselines
                                        Gaofeng Cheng , Yifan Chen , Runyan Yang , Qingxuan Li , Zehui Yang , Lingxuan Ye , Pengyuan Zhang , Qingqing Zhang , Lei Xie , Yanmin Qian , Kong Aik Lee , and Yonghong Yan
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      34. The X-Lance Speaker Diarization System for the Conversational Short-phrase Speaker Diarization Challenge 2022
                                        Tao Liu , Xu Xiang , Zhengyang Chen , Bing Han , Kai Yu, and Yanmin Qian
                                        In 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022, Singapore, December 11-14, 2022 , Oct 2022
                                      35. End-to-End Multi-Speaker ASR with Independent Vector Analysis
                                        Robin Scheibler , Wangyou Zhang , Xuankai Chang , Shinji Watanabe , and Yanmin Qian
                                        In IEEE Spoken Language Technology Workshop, SLT 2022, Doha, Qatar, January 9-12, 2023 , Oct 2022
                                      36. A Comprehensive Study on Self-Supervised Distillation for Speaker Representation Learning
                                        Zhengyang Chen , Yao Qian , Bing Han , Yanmin Qian , and Michael Zeng
                                        In IEEE Spoken Language Technology Workshop, SLT 2022, Doha, Qatar, January 9-12, 2023 , Oct 2022
                                      37. The SJTU X-LANCE Lab System for CNSRC 2022
                                        Zhengyang Chen , Bei Liu , Bing Han , Leying Zhang , and Yanmin Qian
                                        CoRR, Oct 2022
                                      38. SJTU-AISPEECH System for VoxCeleb Speaker Recognition Challenge 2022
                                        Zhengyang Chen , Bing Han , Xu Xiang , Houjun Huang , Bei Liu , and Yanmin Qian
                                        CoRR, Oct 2022
                                      39. Build a SRE Challenge System: Lessons from VoxSRC 2022 and CNSRC 2022
                                        Zhengyang Chen , Bing Han , Xu Xiang , Houjun Huang , Bei Liu , and Yanmin Qian
                                        CoRR, Oct 2022
                                      40. Factorized Neural Transducer for Efficient Language Model Adaptation
                                        Xie Chen, Zhong Meng , Sarangarajan Parthasarathy , and Jinyu Li
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      41. VQTTS: High-Fidelity Text-to-Speech Synthesis with Self-Supervised VQ Acoustic Feature
                                        Chenpeng Du , Yiwei Guo , Xie Chen, and Kai Yu
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      42. Internal Language Model Adaptation with Text-Only Data for End-to-End Speech Recognition
                                        Zhong Meng , Yashesh Gaur , Naoyuki Kanda , Jinyu Li , Xie Chen , Yu Wu , and Yifan Gong
                                        In Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022 , Oct 2022
                                      43. Exploring Effective Distillation of Self-Supervised Speech Models for Automatic Speech Recognition
                                        Yujin Wang , Changli Tang , Ziyang Ma , Zhisheng Zheng , Xie Chen, and Wei-Qiang Zhang
                                        CoRR, Oct 2022
                                      44. MT4SSL: Boosting Self-Supervised Speech Representation Learning by Integrating Multiple Targets
                                        Ziyang Ma , Zhisheng Zheng , Changli Tang , Yujin Wang , and Xie Chen
                                        CoRR, Oct 2022
                                      45. EmoDiff: Intensity Controllable Emotional Text-to-Speech with Soft-Label Guidance
                                        Yiwei Guo , Chenpeng Du , Xie Chen, and Kai Yu
                                        CoRR, Oct 2022
                                      46. Exploring Effective Fusion Algorithms for Speech Based Self-Supervised Learning Models
                                        Changli Tang , Yujin Wang , Xie Chen, and Wei-Qiang Zhang
                                        CoRR, Oct 2022
                                      47. D4: a Chinese Dialogue Dataset for Depression-Diagnosis-Oriented Chat
                                        Binwei Yao , Chao Shi , Likai Zou , Lingfeng Dai , Mengyue Wu, Lu Chen, Zhen Wang , and Kai Yu
                                        In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
                                      48. Symptom Identification for Interpretable Detection of Multiple Mental Disorders on Social Media
                                        Zhiling Zhang , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
                                      49. Category-Adapted Sound Event Enhancement with Weakly Labeled Data
                                        Guangwei Li , Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      50. Diversity-Controllable and Accurate Audio Captioning Based on Neural Condition
                                        Xuenan Xu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      51. Can Audio Captions Be Evaluated With Image Caption Metrics?
                                        Zelin Zhou , Zhiling Zhang , Xuenan Xu , Zeyu Xie , Mengyue Wu , and Kenny Q. Zhu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      52. Navigating Audio-Visual Event Detection Across Mismatched Modalities
                                        Guangwei Li , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      53. Audio-Text Retrieval in Context
                                        Siyu Lou , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      54. Climate and Weather: Inspecting Depression Detection via Emotion Recognition
                                        Wen Wu , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      55. Psychiatric Scale Guided Risky Post Screening for Early Detection of Depression
                                        Zhiling Zhang , Siyuan Chen , Mengyue Wu , and Kenny Q. Zhu
                                        In Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence, IJCAI 2022, Vienna, Austria, 23-29 July 2022 , Oct 2022
                                      56. A Comprehensive Survey of Automated Audio Captioning
                                        Xuenan Xu , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2022
                                      57. DialogZoo: Large-Scale Dialog-Oriented Task Learning
                                        Zhi Chen , Jijia Bao , Lu Chen, Yuncong Liu , Da Ma , Bei Chen , Mengyue Wu , Su Zhu , Jian-Guang Lou , and Kai Yu
                                        CoRR, Oct 2022
                                      58. Data augmentation based non-parallel voice conversion with frame-level speaker disentangler
                                        Bo Chen , Zhihang Xu , and Kai Yu
                                        Speech Commun., Oct 2022
                                      59. Phone-Level Prosody Modelling With GMM-Based MDN for Diverse and Controllable Speech Synthesis
                                        Chenpeng Du , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      60. Neural Fusion for Voice Cloning
                                        Bo Chen , Chenpeng Du , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2022
                                      61. META-GUI: Towards Multi-modal Conversational Agents on Mobile GUI
                                        Liangtai Sun , Xingyu Chen , Lu Chen, Tianle Dai , Zichen Zhu, and Kai Yu
                                        In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
                                      62. AdapterShare: Task Correlation Modeling with Adapter Differentiation
                                        Zhi Chen , Bei Chen , Lu Chen, Kai Yu, and Jian-Guang Lou
                                        In Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, EMNLP 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022 , Oct 2022
                                      63. LatticeBART: Lattice-to-Lattice Pre-Training for Speech Recognition
                                        Lingfeng Dai , Lu Chen, Zhikai Zhou , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      64. Text Adaptive Detection for Customizable Keyword Spotting
                                        Yu Xi , Tian Tan , Wangyou Zhang , Baochen Yang , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      65. Unsupervised Word-Level Prosody Tagging for Controllable Speech Synthesis
                                        Yiwei Guo , Chenpeng Du , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2022, Virtual and Singapore, 23-27 May 2022 , Oct 2022
                                      66. The AISP-SJTU Simultaneous Translation System for IWSLT 2022
                                        Qinpei Zhu , Renshou Wu , Guangfeng Liu , Xinyu Zhu , Xingyu Chen , Yang Zhou , Qingliang Miao , Rui Wang , and Kai Yu
                                        In Proceedings of the 19th International Conference on Spoken Language Translation, IWSLT@ACL 2022, Dublin, Ireland (in-person and online), May 26-27, 2022 , Oct 2022
                                      67. TIE: Topological Information Enhanced Structural Reading Comprehension on Web Pages
                                        Zihan Zhao , Lu Chen, Ruisheng Cao , Hongshen Xu , Xingyu Chen , and Kai Yu
                                        In Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL 2022, Seattle, WA, United States, July 10-15, 2022 , Oct 2022
                                      68. UniDU: Towards A Unified Generative Dialogue Understanding Framework
                                        Zhi Chen , Lu Chen , Bei Chen , Libo Qin , Yuncong Liu , Su Zhu , Jian-Guang Lou , and Kai Yu
                                        In Proceedings of the 23rd Annual Meeting of the Special Interest Group on Discourse and Dialogue, SIGDIAL 2022, Edinburgh, UK, 07-09 September 2022 , Oct 2022
                                      69. The AISP-SJTU Translation System for WMT 2022
                                        Guangfeng Liu , Qinpei Zhu , Xingyu Chen , Renjie Feng , Jianxin Ren , Renshou Wu , Qingliang Miao , Rui Wang , and Kai Yu
                                        In Proceedings of the Seventh Conference on Machine Translation, WMT 2022, Abu Dhabi, United Arab Emirates (Hybrid), December 7-8, 2022 , Oct 2022

                                      2021

                                      1. Modified Magnitude-Phase Spectrum Information for Spoofing Detection
                                        Jichen Yang , Hongji Wang , Rohan Kumar Das , and Yanmin Qian
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
                                      2. Audio-Visual Deep Neural Network for Robust Person Verification
                                        Yanmin Qian , Zhengyang Chen , and Shuai Wang
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
                                      3. Dual-Path Modeling for Long Recording Speech Separation in Meetings
                                        Chenda Li , Zhuo Chen , Yi Luo , Cong Han , Tianyan Zhou , Keisuke Kinoshita , Marc Delcroix , Shinji Watanabe , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      4. Self-Supervised Learning Based Domain Adaptation for Robust Speaker Verification
                                        Zhengyang Chen , Shuai Wang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      5. SynAug: Synthesis-Based Data Augmentation for Text-Dependent Speaker Verification
                                        Chenpeng Du , Bing Han , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      6. Unit Selection Synthesis Based Data Augmentation for Fixed Phrase Speaker Verification
                                        Houjun Huang , Xu Xiang , Fei Zhao , Shuai Wang , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      7. AISpeech-SJTU Accent Identification System for the Accented English Speech Recognition Challenge
                                        Houjun Huang , Xu Xiang , Yexin Yang , Rao Ma , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      8. AISpeech-SJTU ASR System for the Accented English Speech Recognition Challenge
                                        Tian Tan , Yizhou Lu , Rao Ma , Sen Zhu , Jiaqi Guo , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      9. Towards Data Selection on TTS Data for Children’s Speech Recognition
                                        Wei Wang , Zhikai Zhou , Yizhou Lu , Hongji Wang , Chenpeng Du , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      10. End-to-End Dereverberation, Beamforming, and Speech Recognition with Improved Numerical Stability and Advanced Frontend
                                        Wangyou Zhang , Christoph Böddeker , Shinji Watanabe , Tomohiro Nakatani , Marc Delcroix , Keisuke Kinoshita , Tsubasa Ochiai , Naoyuki Kamo , Reinhold Haeb-Umbach , and Yanmin Qian
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      11. The Accented English Speech Recognition Challenge 2020: Open Datasets, Tracks, Baselines, Results and Methods
                                        Xian Shi , Fan Yu , Yizhou Lu , Yuhao Liang , Qiangze Feng , Daliang Wang , Yanmin Qian , and Lei Xie
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      12. Convolutive Transfer Function Invariant SDR Training Criteria for Multi-Channel Reverberant Speech Separation
                                        Christoph Böddeker , Wangyou Zhang , Tomohiro Nakatani , Keisuke Kinoshita , Tsubasa Ochiai , Marc Delcroix , Naoyuki Kamo , Yanmin Qian , and Reinhold Haeb-Umbach
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      13. Layer-Wise Fast Adaptation for End-to-End Multi-Accent Speech Recognition
                                        Xun Gong , Yizhou Lu , Zhikai Zhou , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      14. Knowledge Distillation from Multi-Modality to Single-Modality for Person Verification
                                        Leying Zhang , Zhengyang Chen , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      15. Basis-MelGAN: Efficient Neural Vocoder Based on Audio Decomposition
                                        Zhengxi Liu , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      16. The SJTU System for Short-Duration Speaker Verification Challenge 2021
                                        Bing Han , Zhengyang Chen , Zhikai Zhou , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      17. Audio-Visual Multi-Talker Speech Recognition in a Cocktail Party
                                        Yifei Wu , Chenda Li , Song Yang , Zhongqin Wu , and Yanmin Qian
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      18. Speaker Embedding Augmentation with Noise Distribution Matching
                                        Xun Gong , Zhengyang Chen , Yexin Yang , Shuai Wang , Lan Wang , and Yanmin Qian
                                        In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
                                      19. Revisiting the Statistics Pooling Layer in Deep Speaker Embedding Learning
                                        Shuai Wang , Yexin Yang , Yanmin Qian , and Kai Yu
                                        In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
                                      20. Data Augmentation for End-to-End Code-Switching Speech Recognition
                                        Chenpeng Du , Hao Li , Yizhou Lu , Lan Wang , and Yanmin Qian
                                        In IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021 , Oct 2021
                                      21. Dual-Path RNN for Long Recording Speech Separation
                                        Chenda Li , Yi Luo , Cong Han , Jinyu Li , Takuya Yoshioka , Tianyan Zhou , Marc Delcroix , Keisuke Kinoshita , Christoph Böddeker , Yanmin Qian , Shinji Watanabe , and Zhuo Chen
                                        In IEEE Spoken Language Technology Workshop, SLT 2021, Shenzhen, China, January 19-22, 2021 , Oct 2021
                                      22. Closing the Gap Between Time-Domain Multi-Channel Speech Enhancement on Real and Simulation Conditions
                                        Wangyou Zhang , Jing Shi , Chenda Li , Shinji Watanabe , and Yanmin Qian
                                        In IEEE Workshop on Applications of Signal Processing to Audio and Acoustics, WASPAA 2021, New Paltz, NY, USA, October 17-20, 2021 , Oct 2021
                                      23. Towards Duration Robust Weakly Supervised Sound Event Detection
                                        Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
                                      24. Voice Activity Detection in the Wild: A Data-Driven Approach Using Teacher-Student Training
                                        Heinrich Dinkel , Shuai Wang , Xuenan Xu , Mengyue Wu, and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2021
                                      25. Building Interpretable Interaction Trees for Deep NLP Models
                                        Die Zhang , Hao Zhang , Huilin Zhou , Xiaoyi Bao , Da Huo , Ruizhao Chen , Xu Cheng , Mengyue Wu, and Quanshi Zhang
                                        In Thirty-Fifth AAAI Conference on Artificial Intelligence, AAAI 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, IAAI 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, EAAI 2021, Virtual Event, February 2-9, 2021 , Oct 2021
                                      26. Decoupled Dialogue Modeling and Semantic Parsing for Multi-Turn Text-to-SQL
                                        Zhi Chen , Lu Chen, Hanqi Li , Ruisheng Cao , Da Ma , Mengyue Wu, and Kai Yu
                                        In Findings of the Association for Computational Linguistics: ACL/IJCNLP 2021, Online Event, August 1-6, 2021 , Oct 2021
                                      27. Enriching Ontology with Temporal Commonsense for Low-Resource Audio Tagging
                                        Zhiling Zhang , Zelin Zhou , Haifeng Tang , Guangwei Li , Mengyue Wu , and Kenny Q. Zhu
                                        In CIKM ’21: The 30th ACM International Conference on Information and Knowledge Management, Virtual Event, Queensland, Australia, November 1 - 5, 2021 , Oct 2021
                                      28. Text-to-Audio Grounding: Building Correspondence Between Captions and Sound Events
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      29. Investigating Local and Global Information for Automated Audio Captioning with Transfer Learning
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, Zeyu Xie , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2021, Toronto, ON, Canada, June 6-11, 2021 , Oct 2021
                                      30. A Lightweight Framework for Online Voice Activity Detection in the Wild
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      31. Audio Caption in a Car Setting with a Sentence-Level Loss
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021, Hong Kong, January 24-27, 2021 , Oct 2021
                                      32. DEPA: Self-Supervised Audio Embedding for Depression Detection
                                        Pingyue Zhang , Mengyue Wu, Heinrich Dinkel , and Kai Yu
                                        In MM ’21: ACM Multimedia Conference, Virtual Event, China, October 20 - 24, 2021 , Oct 2021
                                      33. LET: Linguistic Knowledge Enhanced Graph Transformer for Chinese Short Text Matching
                                        Boer Lyu , Lu Chen , Su Zhu , and Kai Yu
                                        In Thirty-Fifth AAAI Conference on Artificial Intelligence, AAAI 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, IAAI 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, EAAI 2021, Virtual Event, February 2-9, 2021 , Oct 2021
                                      34. LGESQL: Line Graph Enhanced Text-to-SQL Model with Mixed Local and Non-Local Relations
                                        Ruisheng Cao , Lu Chen , Zhi Chen , Yanbin Zhao , Su Zhu , and Kai Yu
                                        In Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing, ACL/IJCNLP 2021, (Volume 1: Long Papers), Virtual Event, August 1-6, 2021 , Oct 2021
                                      35. WebSRC: A Dataset for Web-Based Structural Reading Comprehension
                                        Xingyu Chen , Zihan Zhao , Lu Chen, Jiabao Ji , Danyang Zhang , Ao Luo , Yuxuan Xiong , and Kai Yu
                                        In Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, EMNLP 2021, Virtual Event / Punta Cana, Dominican Republic, 7-11 November, 2021 , Oct 2021
                                      36. Glyph Enhanced Chinese Character Pre-Training for Lexical Sememe Prediction
                                        Boer Lyu , Lu Chen, and Kai Yu
                                        In Findings of the Association for Computational Linguistics: EMNLP 2021, Virtual Event / Punta Cana, Dominican Republic, 16-20 November, 2021 , Oct 2021
                                      37. Class-Based Neural Network Language Model for Second-Pass Rescoring in ASR
                                        Lingfeng Dai , Qi Liu , and Kai Yu
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      38. Rich Prosody Diversity Modelling with Phone-Level Mixture Density Network
                                        Chenpeng Du , and Kai Yu
                                        In Interspeech 2021, 22nd Annual Conference of the International Speech Communication Association, Brno, Czechia, 30 August - 3 September 2021 , Oct 2021
                                      39. ShadowGNN: Graph Projection Neural Network for Text-to-SQL Parser
                                        Zhi Chen , Lu Chen, Yanbin Zhao , Ruisheng Cao , Zihan Xu , Su Zhu , and Kai Yu
                                        In Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2021, Online, June 6-11, 2021 , Oct 2021
                                      40. Few-Shot NLU with Vector Projection Distance and Abstract Triangular CRF
                                        Su Zhu , Lu Chen, Ruisheng Cao , Zhi Chen , Qingliang Miao , and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 10th CCF International Conference, NLPCC 2021, Qingdao, China, October 13-17, 2021, Proceedings, Part I , Oct 2021
                                      41. Relation-Aware Multi-hop Reasoning for Visual Dialog
                                        Yao Zhao , Lu Chen, and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 10th CCF International Conference, NLPCC 2021, Qingdao, China, October 13-17, 2021, Proceedings, Part I , Oct 2021
                                      42. Mixture Density Network for Phone-Level Prosody Modelling in Speech Synthesis
                                        Chenpeng Du , and Kai Yu
                                        CoRR, Oct 2021
                                      43. Diverse and Controllable Speech Synthesis with GMM-Based Phone-Level Prosody Modelling
                                        Chenpeng Du , and Kai Yu
                                        CoRR, Oct 2021

                                      2020

                                      1. Improving End-to-End Single-Channel Multi-Talker Speech Recognition
                                        Wangyou Zhang , Xuankai Chang , Yanmin Qian , and Shinji Watanabe
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      2. Data Augmentation Using Deep Generative Models for Embedding Based Speaker Recognition
                                        Shuai Wang , Yexin Yang , Zhanghao Wu , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      3. End-To-End Multi-Speaker Speech Recognition With Transformer
                                        Xuankai Chang , Wangyou Zhang , Yanmin Qian , Jonathan Le Roux , and Shinji Watanabe
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      4. Text Adaptation for Speaker Verification with Speaker-Text Factorized Embeddings
                                        Yexin Yang , Shuai Wang , Xun Gong , Yanmin Qian , and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      5. Channel Invariant Speaker Embedding Learning with Joint Multi-Task and Adversarial Training
                                        Zhengyang Chen , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      6. Deep Audio-Visual Speech Separation with Attention Mechanism
                                        Chenda Li , and Yanmin Qian
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      7. Learning Contextual Language Embeddings for Monaural Multi-Talker Speech Recognition
                                        Wangyou Zhang , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      8. End-to-End Far-Field Speech Recognition with Unified Dereverberation and Beamforming
                                        Wangyou Zhang , Aswin Shanmugam Subramanian , Xuankai Chang , Shinji Watanabe , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      9. Dual-Adversarial Domain Adaptation for Generalized Replay Attack Detection
                                        Hongji Wang , Heinrich Dinkel , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      10. Listen, Watch and Understand at the Cocktail Party: Audio-Visual-Contextual Speech Separation
                                        Chenda Li , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      11. Multi-Modality Matters: A Performance Leap on VoxCeleb
                                        Zhengyang Chen , Shuai Wang , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      12. Adversarial Domain Adaptation for Speaker Verification Using Partially Shared Network
                                        Zhengyang Chen , Shuai Wang , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      13. Bi-Encoder Transformer Network for Mandarin-English Code-Switching Speech Recognition Using Mixture of Experts
                                        Yizhou Lu , Mingkun Huang , Hao Li , Jiaqi Guo , and Yanmin Qian
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      14. End-to-End Speaker-Dependent Voice Activity Detection
                                        Yefei Chen , Shuai Wang , Yanmin Qian , and Kai Yu
                                        CoRR, Oct 2020
                                      15. A CRNN-GRU Based Reinforcement Learning Approach to Audio Captioning
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In Proceedings of the 5th Workshop on Detection and Classification of Acoustic Scenes and Events 2020 (DCASE 2020), Tokyo, Japan (full virtual), November 2-4, 2020 , Oct 2020
                                      16. Multiple Sound Sources Localization from Coarse to Fine
                                        Rui Qian , Di Hu , Heinrich Dinkel , Mengyue Wu, Ning Xu , and Weiyao Lin
                                        In Computer Vision - ECCV 2020 - 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part XX , Oct 2020
                                      17. Voice Activity Detection in the Wild via Weakly Supervised Sound Event Detection
                                        Yefei Chen , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      18. GPVAD: Towards noise robust voice activity detection via weakly supervised sound event detection
                                        Heinrich Dinkel , Yefei Chen , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2020
                                      19. Interpreting Hierarchical Linguistic Interactions in DNNs
                                        Die Zhang , Huilin Zhou , Xiaoyi Bao , Da Huo , Ruizhao Chen , Xu Cheng , Hao Zhang , Mengyue Wu, and Quanshi Zhang
                                        CoRR, Oct 2020
                                      20. Towards a new generation of artificial intelligence in China
                                        Fei Wu , Cewu Lu , Mingjie Zhu , Hao Chen , Jun Zhu , Kai Yu, Lei Li , Ming Li , Qianfeng Chen , Xi Li , Xudong Cao , Zhongyuan Wang , Zhengjun Zha , Yueting Zhuang , and Yunhe Pan
                                        Nat. Mach. Intell., Oct 2020
                                      21. Prior Knowledge Driven Label Embedding for Slot Filling in Natural Language Understanding
                                        Su Zhu , Zijian Zhao , Rao Ma , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      22. Dual Learning for Semi-Supervised Natural Language Understanding
                                        Su Zhu , Ruisheng Cao , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      23. Modular End-to-End Automatic Speech Recognition Framework for Acoustic-to-Word Model
                                        Qi Liu , Zhehuai Chen , Hao Li , Mingkun Huang , Yizhou Lu , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      24. Distributed Structured Actor-Critic Reinforcement Learning for Universal Dialogue Management
                                        Zhi Chen , Lu Chen, Xiaoyuan Liu , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      25. Neural Network Language Model Compression With Product Quantization and Soft Binarization
                                        Kai Yu, Rao Ma , Kaiyu Shi , and Qi Liu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2020
                                      26. Schema-Guided Multi-Domain Dialogue State Tracking with Graph Attention Neural Networks
                                        Lu Chen, Boer Lv , Chi Wang , Su Zhu , Bowen Tan , and Kai Yu
                                        In The Thirty-Fourth AAAI Conference on Artificial Intelligence, AAAI 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, IAAI 2020, The Tenth AAAI Symposium on Educational Advances in Artificial Intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 , Oct 2020
                                      27. Semi-Supervised Text Simplification with Back-Translation and Asymmetric Denoising Autoencoders
                                        Yanbin Zhao , Lu Chen , Zhi Chen , and Kai Yu
                                        In The Thirty-Fourth AAAI Conference on Artificial Intelligence, AAAI 2020, The Thirty-Second Innovative Applications of Artificial Intelligence Conference, IAAI 2020, The Tenth AAAI Symposium on Educational Advances in Artificial Intelligence, EAAI 2020, New York, NY, USA, February 7-12, 2020 , Oct 2020
                                      28. Line Graph Enhanced AMR-to-Text Generation with Mix-Order Graph Attention Networks
                                        Yanbin Zhao , Lu Chen , Zhi Chen , Ruisheng Cao , Su Zhu , and Kai Yu
                                        In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
                                      29. Neural Graph Matching Networks for Chinese Short Text Matching
                                        Lu Chen, Yanbin Zhao , Boer Lyu , Lesheng Jin , Zhi Chen , Su Zhu , and Kai Yu
                                        In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
                                      30. Unsupervised Dual Paraphrasing for Two-stage Semantic Parsing
                                        Ruisheng Cao , Su Zhu , Chenyu Yang , Chen Liu , Rao Ma , Yanbin Zhao , Lu Chen, and Kai Yu
                                        In Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020 , Oct 2020
                                      31. Efficient Context and Schema Fusion Networks for Multi-Domain Dialogue State Tracking
                                        Su Zhu , Jieyu Li , Lu Chen, and Kai Yu
                                        In Findings of the Association for Computational Linguistics: EMNLP 2020, Online Event, 16-20 November 2020 , Oct 2020
                                      32. Duration Robust Weakly Supervised Sound Event Detection
                                        Heinrich Dinkel , and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      33. Investigation of Specaugment for Deep Speaker Embedding Learning
                                        Shuai Wang , Johan Rohdin , Oldřich Plchot , Lukáš Burget , Kai Yu, and Jan Černocký
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      34. Speaker Augmentation for Low Resource Speech Recognition
                                        Chenpeng Du , and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      35. Neural Lattice Search for Speech Recognition
                                        Rao Ma , Hao Li , Qi Liu , Lu Chen, and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      36. A Hierarchical Tracker for Multi-Domain Dialogue State Tracking
                                        Jieyu Li , Su Zhu , and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      37. Addressing the Polysemy Problem in Language Modeling with Attentional Multi-Sense Embeddings
                                        Rao Ma , Lesheng Jin , Qi Liu , Lu Chen, and Kai Yu
                                        In 2020 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2020, Barcelona, Spain, May 4-8, 2020 , Oct 2020
                                      38. CODA: Improving Resource Utilization by Slimming and Co-locating DNN and CPU Jobs
                                        Han Zhao , Weihao Cui , Quan Chen , Jingwen Leng , Kai Yu, Deze Zeng , Chao Li , and Minyi Guo
                                        In 40th IEEE International Conference on Distributed Computing Systems, ICDCS 2020, Singapore, November 29 - December 1, 2020 , Oct 2020
                                      39. Jointly Encoding Word Confusion Network and Dialogue Context with BERT for Spoken Language Understanding
                                        Chen Liu , Su Zhu , Zijian Zhao , Ruisheng Cao , Lu Chen, and Kai Yu
                                        In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020 , Oct 2020
                                      40. Memory Attention Neural Network for Multi-domain Dialogue State Tracking
                                        Zihan Xu , Zhi Chen , Lu Chen , Su Zhu , and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
                                      41. Robust Spoken Language Understanding with RL-Based Value Error Recovery
                                        Chen Liu , Su Zhu , Lu Chen, and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
                                      42. An Investigation on Different Underlying Quantization Schemes for Pre-trained Language Models
                                        Zihan Zhao , Yuncong Liu , Lu Chen, Qi Liu , Rao Ma , and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 9th CCF International Conference, NLPCC 2020, Zhengzhou, China, October 14-18, 2020, Proceedings, Part I , Oct 2020
                                      43. An Investigation on Deep Learning with Beta Stabilizer
                                        Qi Liu , Tian Tan , and Kai Yu
                                        CoRR, Oct 2020
                                      44. Vector Projection Network for Few-shot Slot Tagging in Natural Language Understanding
                                        Su Zhu , Ruisheng Cao , Lu Chen, and Kai Yu
                                        CoRR, Oct 2020
                                      45. Deep Reinforcement Learning for On-line Dialogue State Tracking
                                        Zhi Chen , Lu Chen, Xiang Zhou , and Kai Yu
                                        CoRR, Oct 2020
                                      46. Structured Hierarchical Dialogue Policy with Graph Neural Networks
                                        Zhi Chen , Xiaoyuan Liu , Lu Chen, and Kai Yu
                                        CoRR, Oct 2020
                                      47. Dual Learning for Dialogue State Tracking
                                        Zhi Chen , Lu Chen, Yanbin Zhao , Su Zhu , and Kai Yu
                                        CoRR, Oct 2020
                                      48. CREDIT: Coarse-to-Fine Sequence Generation for Dialogue State Tracking
                                        Zhi Chen , Lu Chen, Zihan Xu , Yanbin Zhao , Su Zhu , and Kai Yu
                                        CoRR, Oct 2020

                                      2019

                                      1. Erratum to: Past review, current progress, and challenges ahead on the cocktail party problem
                                        Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
                                        Frontiers Inf. Technol. Electron. Eng., Oct 2019
                                      2. Binary neural networks for speech recognition
                                        Yanmin Qian and Xu Xiang
                                        Frontiers Inf. Technol. Electron. Eng., Oct 2019
                                      3. Data augmentation using generative adversarial networks for robust speech recognition
                                        Yanmin Qian , Hu Hu , and Tian Tan
                                        Speech Commun., Oct 2019
                                      4. Discriminative Neural Embedding Learning for Short-Duration Text-Independent Speaker Verification
                                        Shuai Wang , Zili Huang , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2019
                                      5. Margin Matters: Towards More Discriminative Deep Neural Network Embeddings for Speaker Recognition
                                        Xu Xiang , Shuai Wang , Houjun Huang , Yanmin Qian , and Kai Yu
                                        In 2019 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2019, Lanzhou, China, November 18-21, 2019 , Oct 2019
                                      6. GANs for Children: A Generative Data Augmentation Strategy for Children Speech Recognition
                                        Peiyao Sheng , Zhuolin Yang , and Yanmin Qian
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      7. MIMO-Speech: End-to-End Multi-Channel Multi-Speaker Speech Recognition
                                        Xuankai Chang , Wangyou Zhang , Yanmin Qian , Jonathan Le Roux , and Shinji Watanabe
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      8. Exploring Model Units and Training Strategies for End-to-End Speech Recognition
                                        Mingkun Huang , Yizhou Lu , Lan Wang , Yanmin Qian , and Kai Yu
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      9. End-to-End Overlapped Speech Detection and Speaker Counting with Raw Waveform
                                        Wangyou Zhang , Man Sun , Lan Wang , and Yanmin Qian
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      10. Knowledge Distillation for Small Foot-print Deep Speaker Embedding
                                        Shuai Wang , Yexin Yang , Tianzhe Wang , Yanmin Qian , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
                                      11. End-to-end Monaural Multi-speaker ASR System without Pretraining
                                        Xuankai Chang , Yanmin Qian , Kai Yu, and Shinji Watanabe
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
                                      12. The SJTU Robust Anti-Spoofing System for the ASVspoof 2019 Challenge
                                        Yexin Yang , Hongji Wang , Heinrich Dinkel , Zhengyang Chen , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      13. On the Usage of Phonetic Information for Text-Independent Speaker Embedding Extraction
                                        Shuai Wang , Johan Rohdin , Lukáš Burget , Oldřich Plchot , Yanmin Qian , Kai Yu, and Jan Černocký
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      14. Data Augmentation Using Variational Autoencoder for Embedding Based Speaker Verification
                                        Zhanghao Wu , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      15. Joint Decoding of CTC Based Systems for Speech Recognition
                                        Jiaqi Guo , Yongbin You , Yanmin Qian , and Kai Yu
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      16. Knowledge Distillation for End-to-End Monaural Multi-Talker ASR System
                                        Wangyou Zhang , Xuankai Chang , and Yanmin Qian
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      17. Robust DOA Estimation Based on Convolutional Neural Network and Time-Frequency Masking
                                        Wangyou Zhang , Ying Zhou , and Yanmin Qian
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      18. Cross-Domain Replay Spoofing Attack Detection Using Domain Adversarial Training
                                        Hongji Wang , Heinrich Dinkel , Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      19. Prosody Usage Optimization for Children Speech Recognition with Zero Resource Children Speech
                                        Chenda Li and Yanmin Qian
                                        In Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019 , Oct 2019
                                      20. Audio Caption: Listen and Tell
                                        Mengyue Wu, Heinrich Dinkel , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
                                      21. Text-based Depression Detection: What Triggers An Alert
                                        Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2019
                                      22. What does a Car-ssette tape tell?
                                        Xuenan Xu , Heinrich Dinkel , Mengyue Wu, and Kai Yu
                                        CoRR, Oct 2019
                                      23. AgentGraph: Toward Universal Dialogue Management With Structured Deep Reinforcement Learning
                                        Lu Chen , Zhi Chen , Bowen Tan , Sishan Long , Milica Gašić , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2019
                                      24. Semantic Parsing with Dual Learning
                                        Ruisheng Cao , Su Zhu , Chen Liu , Jieyu Li , and Kai Yu
                                        In Proceedings of the 57th Conference of the Association for Computational Linguistics, ACL 2019, Florence, Italy, July 28 - August 2, 2019, Volume 1: Long Papers , Oct 2019
                                      25. Highly Efficient Neural Network Language Model Compression Using Soft Binarization Training
                                        Rao Ma , Qi Liu , and Kai Yu
                                        In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14-18, 2019 , Oct 2019
                                      26. Data Augmentation with Atomic Templates for Spoken Language Understanding
                                        Zijian Zhao , Su Zhu , and Kai Yu
                                        In Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing, EMNLP-IJCNLP 2019, Hong Kong, China, November 3-7, 2019 , Oct 2019
                                      27. A Hierarchical Decoding Model for Spoken Language Understanding from Unaligned Data
                                        Zijian Zhao , Su Zhu , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2019, Brighton, United Kingdom, May 12-17, 2019 , Oct 2019
                                      28. CATSLU: The 1st Chinese Audio-Textual Spoken Language Understanding Challenge
                                        Su Zhu , Zijian Zhao , Tiejun Zhao , Chengqing Zong , and Kai Yu
                                        In International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019 , Oct 2019
                                      29. Robust Spoken Language Understanding with Acoustic and Domain Knowledge
                                        Hao Li , Chen Liu , Su Zhu , and Kai Yu
                                        In International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019 , Oct 2019
                                      30. Cross Aggregation of Multi-head Attention for Neural Machine Translation
                                        Juncheng Cao , Hai Zhao , and Kai Yu
                                        In Natural Language Processing and Chinese Computing - 8th CCF International Conference, NLPCC 2019, Dunhuang, China, October 9-14, 2019, Proceedings, Part I , Oct 2019
                                      31. International Conference on Multimodal Interaction, ICMI 2019, Suzhou, China, October 14-18, 2019
                                        Oct 2019

                                      2018

                                      1. Past review, current progress, and challenges ahead on the cocktail party problem
                                        Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
                                        Frontiers Inf. Technol. Electron. Eng., Oct 2018
                                      2. Erratum to: Past review, current progress, and challenges ahead on the cocktail party problem
                                        Yanmin Qian , Chao Weng , Xuankai Chang , Shuai Wang , and Dong Yu
                                        Frontiers Inf. Technol. Electron. Eng., Oct 2018
                                      3. Sequence discriminative training for deep learning based acoustic keyword spotting
                                        Zhehuai Chen , Yanmin Qian , and Kai Yu
                                        Speech Commun., Oct 2018
                                      4. Single-channel multi-talker speech recognition with permutation invariant training
                                        Yanmin Qian , Xuankai Chang , and Dong Yu
                                        Speech Commun., Oct 2018
                                      5. Adaptive Very Deep Convolutional Residual Network for Noise Robust Speech Recognition
                                        Tian Tan , Yanmin Qian , Hu Hu , Ying Zhou , Wen Ding , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
                                      6. Investigating Raw Wave Deep Neural Networks for End-to-End Speaker Spoofing Detection
                                        Heinrich Dinkel , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
                                      7. Robust Mask Estimation By Integrating Neural Network-Based and Clustering-Based Approaches for Adaptive Acoustic Beamforming
                                        Ying Zhou and Yanmin Qian
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      8. Knowledge Transfer in Permutation Invariant Training for Single-Channel Multi-Talker Speech Recognition
                                        Tian Tan , Yanmin Qian , and Dong Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      9. Joint I-Vector with End-to-End System for Short Duration Text-Independent Speaker Verification
                                        Zili Huang , Shuai Wang , and Yanmin Qian
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      10. Generative Adversarial Networks Based Data Augmentation for Noise Robust Speech Recognition
                                        Hu Hu , Tian Tan , and Yanmin Qian
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      11. Focal KL-Divergence Based Dilated Convolutional Neural Networks for Co-Channel Speaker Identification
                                        Shuai Wang , Yanmin Qian , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      12. Noise Robust Speech Recognition on Aurora4 by Humans and Machines
                                        Yanmin Qian , Tian Tan , Hu Hu , and Qi Liu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      13. Fast Adaptation on Deep Mixture Generative Network Based Acoustic Modeling
                                        Wen Ding , Tian Tan , and Yanmin Qian
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      14. Adaptive Permutation Invariant Training with Auxiliary Information for Monaural Multi-Talker Speech Recognition
                                        Xuankai Chang , Yanmin Qian , and Dong Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      15. Permutation Invariant Training of Generative Adversarial Network for Monaural Speech Separation
                                        Lianwu Chen , Meng Yu , Yanmin Qian , Dan Su , and Dong Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      16. Deep Extractor Network for Target Speaker Recovery from Single Channel Speech Mixtures
                                        Jun Wang , Jie Chen , Dan Su , Lianwu Chen , Meng Yu , Yanmin Qian , and Dong Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      17. Monaural Multi-Talker Speech Recognition with Attention Mechanism and Gated Convolutional Networks
                                        Xuankai Chang , Yanmin Qian , and Dong Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      18. Knowledge Distillation for Sequence Model
                                        Mingkun Huang , Yongbin You , Zhehuai Chen , Yanmin Qian , and Kai Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      19. Covariance Based Deep Feature for Text-Dependent Speaker Verification
                                        Shuai Wang , Heinrich Dinkel , Yanmin Qian , and Kai Yu
                                        In Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers , Oct 2018
                                      20. Data Augmentation using Conditional Generative Adversarial Networks for Robust Speech Recognition
                                        Peiyao Sheng , Zhuolin Yang , Hu Hu , Tian Tan , and Yanmin Qian
                                        In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
                                      21. Deep Discriminant Analysis for i-vector Based Robust Speaker Recognition
                                        Shuai Wang , Zili Huang , Yanmin Qian , and Kai Yu
                                        In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
                                      22. Generative Adversarial Networks based X-vector Augmentation for Robust Probabilistic Linear Discriminant Analysis in Speaker Verification
                                        Yexin Yang , Shuai Wang , Man Sun , Yanmin Qian , and Kai Yu
                                        In 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018, Taipei City, Taiwan, November 26-29, 2018 , Oct 2018
                                      23. Rich Short Text Conversation Using Semantic-Key-Controlled Sequence Generation
                                        Kai Yu, Zijian Zhao , Xueyang Wu , Hongtao Lin , and Xuan Liu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2018
                                      24. Structured Dialogue Policy with Graph Neural Networks
                                        Lu Chen, Bowen Tan , Sishan Long , and Kai Yu
                                        In Proceedings of the 27th International Conference on Computational Linguistics, COLING 2018, Santa Fe, New Mexico, USA, August 20-26, 2018 , Oct 2018
                                      25. Towards Universal Dialogue State Tracking
                                        Liliang Ren , Kaige Xie , Lu Chen, and Kai Yu
                                        In Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, Brussels, Belgium, October 31 - November 4, 2018 , Oct 2018
                                      26. On Modular Training of Neural Acoustics-to-Word Model for LVCSR
                                        Zhehuai Chen , Qi Liu , Hao Li , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      27. Semi-Supervised Training Using Adversarial Multi-Task Learning for Spoken Language Understanding
                                        Ouyu Lan , Su Zhu , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      28. Policy Adaptation for Deep Reinforcement Learning-Based Dialogue Management
                                        Lu Chen, Cheng Chang , Zhi Chen , Bowen Tan , Milica Gašić , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      29. Robust Spoken Language Understanding with Unsupervised ASR-Error Adaptation
                                        Su Zhu , Ouyu Lan , and Kai Yu
                                        In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2018, Calgary, AB, Canada, April 15-20, 2018 , Oct 2018
                                      30. MLN: Moment Localization Network and Samples Selection for Moment Retrieval
                                        Bo Huang , Ya Zhang , and Kai Yu
                                        In Proceedings of the 2nd International Conference on Video and Image Processing, ICVIP 2018, Hong Kong, China, December 29-31, 2018 , Oct 2018
                                      31. Angular Softmax for Short-Duration Text-independent Speaker Verification
                                        Zili Huang , Shuai Wang , and Kai Yu
                                        In Interspeech 2018, 19th Annual Conference of the International Speech Communication Association, Hyderabad, India, 2-6 September 2018 , Oct 2018
                                      32. Joint Spoken Language Understanding and Domain Adaptive Language Modeling
                                        Huifeng Zhang , Su Zhu , Shuai Fan , and Kai Yu
                                        In Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers , Oct 2018
                                      33. Binarized LSTM Language Model
                                        Xuan Liu , Di Cao , and Kai Yu
                                        In Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2018, New Orleans, Louisiana, USA, June 1-6, 2018, Volume 1 (Long Papers) , Oct 2018
                                      34. Cost-Sensitive Active Learning for Dialogue State Tracking
                                        Kaige Xie , Cheng Chang , Liliang Ren , Lu Chen, and Kai Yu
                                        In Proceedings of the 19th Annual SIGdial Meeting on Discourse and Dialogue, Melbourne, Australia, July 12-14, 2018 , Oct 2018
                                      35. Concept Transfer Learning for Adaptive Language Understanding
                                        Su Zhu and Kai Yu
                                        In Proceedings of the 19th Annual SIGdial Meeting on Discourse and Dialogue, Melbourne, Australia, July 12-14, 2018 , Oct 2018
                                      36. Intelligence Science and Big Data Engineering - 8th International Conference, IScIDE 2018, Lanzhou, China, August 18-19, 2018, Revised Selected Papers
                                        Oct 2018

                                      2017

                                      1. Phone Synchronous Speech Recognition With CTC Lattices
                                        Zhehuai Chen , Yimeng Zhuang , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2017
                                      2. Deep Feature Engineering for Noise Robust Spoofing Detection
                                        Yanmin Qian , Nanxin Chen , Heinrich Dinkel , and Zhizheng Wu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2017
                                      3. Integrating online i-vector into GMM-UBM for text-dependent speaker verification
                                        Xiaowei Jiang , Shuai Wang , Xu Xiang , and Yanmin Qian
                                        In 2017 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, APSIPA ASC 2017, Kuala Lumpur, Malaysia, December 12-15, 2017 , Oct 2017
                                      4. Future vector enhanced LSTM language model for LVCSR
                                        Qi Liu , Yanmin Qian , and Kai Yu
                                        In 2017 IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2017, Okinawa, Japan, December 16-20, 2017 , Oct 2017
                                      5. Multi-view LSTM Language Model with Word-Synchronized Auxiliary Feature for LVCSR
                                        Yue Wu , Tianxing He , Zhehuai Chen , Yanmin Qian , and Kai Yu
                                        In Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data - 16th China National Conference, CCL 2017, - and - 5th International Symposium, NLP-NABD 2017, Nanjing, China, October 13-15, 2017, Proceedings , Oct 2017
                                      6. End-to-end spoofing detection with raw waveform CLDNNs
                                        Heinrich Dinkel , Nanxin Chen , Yanmin Qian , and Kai Yu
                                        In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
                                      7. Small-footprint convolutional neural network for spoofing detection
                                        Heinrich Dinkel , Yanmin Qian , and Kai Yu
                                        In 2017 International Joint Conference on Neural Networks, IJCNN 2017, Anchorage, AK, USA, May 14-19, 2017 , Oct 2017
                                      8. Binary Deep Neural Networks for Speech Recognition
                                        Xu Xiang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
                                      9. What Does the Speaker Embedding Encode?
                                        Shuai Wang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
                                      10. Recognizing Multi-Talker Speech with Permutation Invariant Training
                                        Dong Yu , Xuankai Chang , and Yanmin Qian
                                        In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
                                      11. A Unified Confidence Measure Framework Using Auxiliary Normalization Graph
                                        Zhehuai Chen , Yanmin Qian , and Kai Yu
                                        In Intelligence Science and Big Data Engineering - 7th International Conference, IScIDE 2017, Dalian, China, September 22-23, 2017, Proceedings , Oct 2017
                                      12. Adaptation of Deep Neural Network Acoustic Models for Robust Automatic Speech Recognition
                                        Khe Chai Sim , Yanmin Qian , Gautam Mantena , Lahiru Samarakoon , Souvik Kundu , and Tian Tan
                                        In New Era for Robust Speech Recognition, Exploiting Deep Learning , Oct 2017
                                      13. On-line Dialogue Policy Learning with Companion Teaching
                                        Lu Chen, Runzhe Yang , Cheng Chang , Zihao Ye , Xiang Zhou , and Kai Yu
                                        In Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics, EACL 2017, Valencia, Spain, April 3-7, 2017, Volume 2: Short Papers , Oct 2017
                                      14. Affordable On-line Dialogue Policy Learning
                                        Cheng Chang , Runzhe Yang , Lu Chen, Xiang Zhou , and Kai Yu
                                        In Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, EMNLP 2017, Copenhagen, Denmark, September 9-11, 2017 , Oct 2017
                                      15. Agent-Aware Dropout DQN for Safe and Efficient On-line Dialogue Policy Learning
                                        Lu Chen, Xiang Zhou , Cheng Chang , Runzhe Yang , and Kai Yu
                                        In Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, EMNLP 2017, Copenhagen, Denmark, September 9-11, 2017 , Oct 2017
                                      16. Confidence measures for CTC-based phone synchronous decoding
                                        Zhehuai Chen , Yimeng Zhuang , and Kai Yu
                                        In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
                                      17. Encoder-decoder with focus-mechanism for sequence labelling based spoken language understanding
                                        Su Zhu , and Kai Yu
                                        In 2017 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2017, New Orleans, LA, USA, March 5-9, 2017 , Oct 2017
                                      18. Discrete Duration Model for Speech Synthesis
                                        Bo Chen , Tianling Bian , and Kai Yu
                                        In Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017 , Oct 2017
                                      19. Deep Attentive Structured Language Model Based on LSTM
                                        Di Cao , and Kai Yu
                                        In Intelligence Science and Big Data Engineering - 7th International Conference, IScIDE 2017, Dalian, China, September 22-23, 2017, Proceedings , Oct 2017
                                      20. splab at the NTCIR-13 STC-2 Task
                                        Xuan Liu , Xueyang Wu , Ruinian Chen , Zijian Zhao , Hongtao Lin , and Kai Yu
                                        In The 13th NTCIR Conference, Evaluation of Information Access Technologies, National Center of Sciences, Tokyo, Japan, December 5-8, 2017 , Oct 2017

                                      2016

                                      1. Deep features for automatic spoofing detection
                                        Yanmin Qian , Nanxin Chen , and Kai Yu
                                        Speech Commun., Oct 2016
                                      2. Cluster Adaptive Training for Deep Neural Network Based Acoustic Model
                                        Tian Tan , Yanmin Qian , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
                                      3. Neural Network Based Multi-Factor Aware Joint Training for Robust Speech Recognition
                                        Yanmin Qian , Tian Tan , and Dong Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
                                      4. Very Deep Convolutional Neural Networks for Noise Robust Speech Recognition
                                        Yanmin Qian , Mengxiao Bi , Tian Tan , and Kai Yu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2016
                                      5. Overview of BTAS 2016 speaker anti-spoofing competition
                                        Pavel Korshunov , Sébastien Marcel , Hannah Muckenhirn , André R. Gonçalves , A. G. Souza Mello , Ricardo Paranhos Velloso Violato , Flávio Olmos Simões , M. U. Neto , Marcus Assis Angeloni , José Augusto Stuchi , Heinrich Dinkel , Nanxin Chen , Yanmin Qian , Dipjyoti Paul , Goutam Saha , and Md. Sahidullah
                                        In 8th IEEE International Conference on Biometrics Theory, Applications and Systems, BTAS 2016, Niagara Falls, NY, USA, September 6-9, 2016 , Oct 2016
                                      6. Joint acoustic factor learning for robust deep neural network based automatic speech recognition
                                        Souvik Kundu , Gautam Mantena , Yanmin Qian , Tian Tan , Marc Delcroix , and Khe Chai Sim
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      7. Speaker-aware training of LSTM-RNNs for acoustic modelling
                                        Tian Tan , Yanmin Qian , Dong Yu , Souvik Kundu , Liang Lu , Khe Chai Sim , Xiong Xiao , and Yu Zhang
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      8. Improved DNN-based segmentation for multi-genre broadcast audio
                                        Linlin Wang , Chao Zhang , Philip C. Woodland , Mark J. F. Gales , Panagiota Karanasou , Pierre Lanchantin , Xunying Liu , and Yanmin Qian
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      9. An investigation into using parallel data for far-field speech recognition
                                        Yanmin Qian , Tian Tan , and Dong Yu
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      10. Integrated adaptation with multi-factor joint-learning for far-field speech recognition
                                        Yanmin Qian , Tian Tan , Dong Yu , and Yu Zhang
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      11. Unrestricted Vocabulary Keyword Spotting Using LSTM-CTC
                                        Yimeng Zhuang , Xuankai Chang , Yanmin Qian , and Kai Yu
                                        In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
                                      12. Multi-task joint-learning for robust voice activity detection
                                        Yimeng Zhuang , Sibo Tong , Maofan Yin , Yanmin Qian , and Kai Yu
                                        In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
                                      13. Very deep convolutional neural networks for robust speech recognition
                                        Yanmin Qian , and Philip C. Woodland
                                        In 2016 IEEE Spoken Language Technology Workshop, SLT 2016, San Diego, CA, USA, December 13-16, 2016 , Oct 2016
                                      14. Evolvable dialogue state tracking for statistical dialogue management
                                        Kai Yu, Lu Chen, Kai Sun , Qizhe Xie , and Su Zhu
                                        Frontiers Comput. Sci., Oct 2016
                                      15. Discriminatively trained joint speaker and environment representations for adaptation of deep neural network acoustic models
                                        Maofan Yin , Sunil Sivadas , Kai Yu, and Bin Ma
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      16. A comparative study of robustness of deep learning approaches for VAD
                                        Sibo Tong , Hao Gu , and Kai Yu
                                        In 2016 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2016, Shanghai, China, March 20-25, 2016 , Oct 2016
                                      17. Phone Synchronous Decoding with CTC Lattice
                                        Zhehuai Chen , Wei Deng , Tao Xu , and Kai Yu
                                        In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
                                      18. Hybrid Dialogue State Tracking for Real World Human-to-Human Dialogues
                                        Kai Sun , Su Zhu , Lu Chen, Siqiu Yao , Xueyang Wu , and Kai Yu
                                        In Interspeech 2016, 17th Annual Conference of the International Speech Communication Association, San Francisco, CA, USA, September 8-12, 2016 , Oct 2016
                                      19. On training bi-directional neural network language model with noise contrastive estimation
                                        Tianxing He , Yu Zhang , Jasha Droppo , and Kai Yu
                                        In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
                                      20. Rich punctuations prediction using large-scale deep learning
                                        Xueyang Wu , Su Zhu , Yue Wu , and Kai Yu
                                        In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
                                      21. Directed automatic speech transcription error correction using bidirectional LSTM
                                        Da Zheng , Zhehuai Chen , Yue Wu , and Kai Yu
                                        In 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016, Tianjin, China, October 17-20, 2016 , Oct 2016
                                      22. The splab at the NTCIR-12 Short Text Conversation Task
                                        Ke Wu , Xuan Liu , and Kai Yu
                                        In Proceedings of the 12th NTCIR Conference on Evaluation of Information Access Technologies, National Center of Sciences, Tokyo, Japan, June 7-10, 2016 , Oct 2016

                                      2015

                                      1. Deep feature for text-dependent speaker verification
                                        Yuan Liu , Yanmin Qian , Nanxin Chen , Tianfan Fu , Ya Zhang , and Kai Yu
                                        Speech Commun., Oct 2015
                                      2. Multi-task joint-learning of deep neural networks for robust speech recognition
                                        Yanmin Qian , Maofan Yin , Yongbin You , and Kai Yu
                                        In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
                                      3. Cambridge university transcription systems for the multi-genre broadcast challenge
                                        Philip C. Woodland , Xunying Liu , Yanmin Qian , Chao Zhang , Mark J. F. Gales , Penny Karanasou , Pierre Lanchantin , and Linlin Wang
                                        In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
                                      4. The development of the cambridge university alignment systems for the multi-genre broadcast challenge
                                        Pierre Lanchantin , Mark J. F. Gales , Penny Karanasou , Xunying Liu , Yanmin Qian , Linlin Wang , Philip C. Woodland , and Chao Zhang
                                        In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
                                      5. Speaker diarisation and longitudinal linking in multi-genre broadcast data
                                        Penny Karanasou , Mark J. F. Gales , Pierre Lanchantin , Xunying Liu , Yanmin Qian , Linlin Wang , Philip C. Woodland , and Chao Zhang
                                        In 2015 IEEE Workshop on Automatic Speech Recognition and Understanding, ASRU 2015, Scottsdale, AZ, USA, December 13-17, 2015 , Oct 2015
                                      6. Local trajectory based speech enhancement for robust speech recognition with deep neural network
                                        Yongbin You , Yanmin Qian , and Kai Yu
                                        In IEEE China Summit and International Conference on Signal and Information Processing, ChinaSIP 2015, Chengdu, China, July 12-15, 2015 , Oct 2015
                                      7. An investigation on DNN-derived bottleneck features for GMM-HMM based robust speech recognition
                                        Yongbin You , Yanmin Qian , Tianxing He , and Kai Yu
                                        In IEEE China Summit and International Conference on Signal and Information Processing, ChinaSIP 2015, Chengdu, China, July 12-15, 2015 , Oct 2015
                                      8. Cluster adaptive training for deep neural network
                                        Tian Tan , Yanmin Qian , Maofan Yin , Yimeng Zhuang , and Kai Yu
                                        In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
                                      9. A novel static parameter calculation method for model compensation
                                        Suliang Bu , Yunxin Zhao , Yanmin Qian , and Kai Yu
                                        In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
                                      10. Recurrent neural network language model with structured word embeddings for speech recognition
                                        Tianxing He , Xu Xiang , Yanmin Qian , and Kai Yu
                                        In 2015 IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2015, South Brisbane, Queensland, Australia, April 19-24, 2015 , Oct 2015
                                      11. Automatic model redundancy reduction for fast back-propagation for deep neural networks in speech recognition
                                        Yanmin Qian , Tianxing He , Wei Deng , and Kai Yu
                                        In 2015 International Joint Conference on Neural Networks, IJCNN 2015, Killarney, Ireland, July 12-17, 2015 , Oct 2015
                                      12. Multi-task learning for text-dependent speaker verification
                                        Nanxin Chen , Yanmin Qian , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      13. Robust deep feature for spoofing detection - the SJTU system for ASVspoof 2015 challenge
                                        Nanxin Chen , Yanmin Qian , Heinrich Dinkel , Bo Chen , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      14. Very deep convolutional neural networks for LVCSR
                                        Mengxiao Bi , Yanmin Qian , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      15. Paragraph vector based topic model for language model adaptation
                                        Wengong Jin , Tianxing He , Yanmin Qian , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      16. Constrained Markov Bayesian Polynomial for Efficient Dialogue State Tracking
                                        Kai Yu, Kai Sun , Lu Chen , and Su Zhu
                                        IEEE ACM Trans. Audio Speech Lang. Process., Oct 2015
                                      17. An investigation of context clustering for statistical speech synthesis with deep neural network
                                        Bo Chen , Zhehuai Chen , Jiachen Xu , and Kai Yu
                                        In INTERSPEECH 2015, 16th Annual Conference of the International Speech Communication Association, Dresden, Germany, September 6-10, 2015 , Oct 2015
                                      18. Recurrent Polynomial Network for Dialogue State Tracking with Mismatched Semantic Parsers
                                        Qizhe Xie , Kai Sun , Su Zhu , Lu Chen, and Kai Yu
                                        In Proceedings of the SIGDIAL 2015 Conference, The 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 2-4 September 2015, Prague, Czech Republic , Oct 2015
                                      19. Hyper-parameter Optimisation of Gaussian Process Reinforcement Learning for Statistical Dialogue Management
                                        Lu Chen, Pei-Hao Su , and Milica Gasic
                                        In Proceedings of the SIGDIAL 2015 Conference, The 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 2-4 September 2015, Prague, Czech Republic , Oct 2015

                                      2014

                                      1. Stochastic data sweeping for fast DNN training
                                        Wei Deng , Yanmin Qian , Yuchen Fan , Tianfan Fu , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
                                      2. Reshaping deep neural network for fast decoding by node-pruning
                                        Tianxing He , Yuchen Fan , Yanmin Qian , Tian Tan , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
                                      3. Second order vector taylor series based robust speech recognition
                                        Suliang Bu , Yanmin Qian , Khe Chai Sim , Yongbin You , and Kai Yu
                                        In IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2014, Florence, Italy, May 4-9, 2014 , Oct 2014
                                      4. Speaker verification with deep features
                                        Yuan Liu , Tianfan Fu , Yuchen Fan , Yanmin Qian , and Kai Yu
                                        In 2014 International Joint Conference on Neural Networks, IJCNN 2014, Beijing, China, July 6-11, 2014 , Oct 2014
                                      5. Tandem deep features for text-dependent speaker verification
                                        Tianfan Fu , Yanmin Qian , Yuan Liu , and Kai Yu
                                        In INTERSPEECH 2014, 15th Annual Conference of the International Speech Communication Association, Singapore, September 14-18, 2014 , Oct 2014
                                      6. A novel dynamic parameters calculation approach for model compensation
                                        Suliang Bu , Yanmin Qian , and Kai Yu
                                        In INTERSPEECH 2014, 15th Annual Conference of the International Speech Communication Association, Singapore, September 14-18, 2014 , Oct 2014
                                      7. Acoustic emotion recognition using deep neural network
                                        Jianwei Niu , Yanmin Qian , and Kai Yu
                                        In The 9th International Symposium on Chinese Spoken Language Processing, Singapore, September 12-14, 2014 , Oct 2014
                                      8. The SJTU System for Dialog State Tracking Challenge 2
                                        Kai Sun , Lu Chen , Su Zhu , and Kai Yu
                                        In Proceedings of the SIGDIAL 2014 Conference, The 15th Annual Meeting of the Special Interest Group on Discourse and Dialogue, 18-20 June 2014, Philadelphia, PA, USA , Oct 2014
                                      9. A generalized rule based tracker for dialogue state tracking
                                        Kai Sun , Lu Chen , Su Zhu , and Kai Yu
                                        In 2014 IEEE Spoken Language Technology Workshop, SLT 2014, South Lake Tahoe, NV, USA, December 7-10, 2014 , Oct 2014
                                      10. Semantic parser enhancement for dialogue domain extension with little data
                                        Su Zhu , Lu Chen, Kai Sun , Da Zheng , and Kai Yu
                                        In 2014 IEEE Spoken Language Technology Workshop, SLT 2014, South Lake Tahoe, NV, USA, December 7-10, 2014 , Oct 2014

                                      2013

                                      1. Combination of data borrowing strategies for low-resource LVCSR
                                        Yanmin Qian , Kai Yu, and Jia Liu
                                        In 2013 IEEE Workshop on Automatic Speech Recognition and Understanding, Olomouc, Czech Republic, December 8-12, 2013 , Oct 2013
                                      2. MLP-HMM two-stage unsupervised training for low-resource languages on conversational telephone speech recognition
                                        Yanmin Qian , and Jia Liu
                                        In INTERSPEECH 2013, 14th Annual Conference of the International Speech Communication Association, Lyon, France, August 25-29, 2013 , Oct 2013
                                      3. A New Word Language Model Evaluation Metric for Character Based Languages
                                        Peilu Wang , Ruihua Sun , Hai Zhao , and Kai Yu
                                        In Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data - 12th China National Conference, CCL 2013 and First International Symposium, NLP-NABD 2013, Suzhou, China, October 10-12, 2013. Proceedings , Oct 2013

                                      2012

                                      1. Introduction to the Issue on Advances in Spoken Dialogue Systems and Mobile Interface
                                        Jason D. Williams , Kai Yu, Brahim Chaib-draa , Oliver Lemon , Roberto Pieraccini , Olivier Pietquin , Pascal Poupart , and Steve J. Young
                                        IEEE J. Sel. Top. Signal Process., Oct 2012
                                      2. ICMI’12 grand challenge: haptic voice recognition
                                        Khe Chai Sim , Shengdong Zhao , Kai Yu, and Hank Liao
                                        In International Conference on Multimodal Interaction, ICMI ’12, Santa Monica, CA, USA, October 22-26, 2012 , Oct 2012
                                      3. Development of the 2012 SJTU HVR system
                                        Hainan Xu , Yuchen Fan , and Kai Yu
                                        In International Conference on Multimodal Interaction, ICMI ’12, Santa Monica, CA, USA, October 22-26, 2012 , Oct 2012
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/projects/1_project/index.html b/zh/projects/1_project/index.html index 5759bb36ea50..bd2575502a75 100644 --- a/zh/projects/1_project/index.html +++ b/zh/projects/1_project/index.html @@ -1,4 +1,4 @@ - project 1 | X - LANCE

                                      project 1

                                      a project with a background image

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                      +        project 1 | X - LANCE                  

                                      project 1

                                      a project with a background image

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                       layout: page
                                       title: project
                                       description: a project with a background image
                                      diff --git a/zh/projects/2_project/index.html b/zh/projects/2_project/index.html
                                      index c45a2b64cb67..d67a19798465 100644
                                      --- a/zh/projects/2_project/index.html
                                      +++ b/zh/projects/2_project/index.html
                                      @@ -1,4 +1,4 @@
                                      -        project 2 | X - LANCE                  

                                      project 2

                                      a project with a background image and giscus comments

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                      +        project 2 | X - LANCE                  

                                      project 2

                                      a project with a background image and giscus comments

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                       layout: page
                                       title: project
                                       description: a project with a background image
                                      diff --git a/zh/projects/3_project/index.html b/zh/projects/3_project/index.html
                                      index 7a4bac98df34..0fc6c6284206 100644
                                      --- a/zh/projects/3_project/index.html
                                      +++ b/zh/projects/3_project/index.html
                                      @@ -1,4 +1,4 @@
                                      -         project 3 | X - LANCE                  

                                      project 3

                                      a project that redirects to another website

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                      +         project 3 | X - LANCE                  

                                      project 3

                                      a project that redirects to another website

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                       layout: page
                                       title: project
                                       description: a project with a background image
                                      diff --git a/zh/projects/4_project/index.html b/zh/projects/4_project/index.html
                                      index bfe11bc4c279..688ab4b4b80b 100644
                                      --- a/zh/projects/4_project/index.html
                                      +++ b/zh/projects/4_project/index.html
                                      @@ -1,4 +1,4 @@
                                      -        project 4 | X - LANCE                  

                                      project 4

                                      another without an image

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                      +        project 4 | X - LANCE                  

                                      project 4

                                      another without an image

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                       layout: page
                                       title: project
                                       description: a project with a background image
                                      diff --git a/zh/projects/5_project/index.html b/zh/projects/5_project/index.html
                                      index a80967566cd7..34bb21b106c4 100644
                                      --- a/zh/projects/5_project/index.html
                                      +++ b/zh/projects/5_project/index.html
                                      @@ -1,4 +1,4 @@
                                      -        project 5 | X - LANCE                  

                                      project 5

                                      a project with a background image

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                      +        project 5 | X - LANCE                  

                                      project 5

                                      a project with a background image

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                       layout: page
                                       title: project
                                       description: a project with a background image
                                      diff --git a/zh/projects/6_project/index.html b/zh/projects/6_project/index.html
                                      index 5337ffc50ecf..9d6476ad2ba1 100644
                                      --- a/zh/projects/6_project/index.html
                                      +++ b/zh/projects/6_project/index.html
                                      @@ -1,4 +1,4 @@
                                      -        project 6 | X - LANCE                  

                                      project 6

                                      a project with no image

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                      +        project 6 | X - LANCE                  

                                      project 6

                                      a project with no image

                                      Every project has a beautiful feature showcase page. It’s easy to include images in a flexible 3-column grid format. Make your photos 1/3, 2/3, or full width.

                                      To give your project a background in the portfolio page, just add the img tag to the front matter like so:

                                      ---
                                       layout: page
                                       title: project
                                       description: a project with a background image
                                      diff --git a/zh/projects/index.html b/zh/projects/index.html
                                      index e48076ccbd22..19834f634b2c 100644
                                      --- a/zh/projects/index.html
                                      +++ b/zh/projects/index.html
                                      @@ -1 +1 @@
                                      -        项目 | X - LANCE                  
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + 项目 | X - LANCE
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/repositories/index.html b/zh/repositories/index.html index cff3e4bed012..63f574b5c8f1 100644 --- a/zh/repositories/index.html +++ b/zh/repositories/index.html @@ -1 +1 @@ - 仓库 | X - LANCE

                                      仓库

                                      X-LANCE的部分GitHub项目仓库

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + 仓库 | X - LANCE

                                      仓库

                                      X-LANCE的部分GitHub项目仓库

                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file diff --git a/zh/sitemap.xml b/zh/sitemap.xml index 0ee0740ddacb..2ce256f960a7 100644 --- a/zh/sitemap.xml +++ b/zh/sitemap.xml @@ -1 +1 @@ - https://x-lance.github.io/news/announcement_1/ 2023-12-31T00:00:00+00:00 https://x-lance.github.io/news/announcement_2/ 2023-12-31T00:00:00+00:00 https://x-lance.github.io/news/announcement_5/ 2024-01-24T00:00:00+00:00 https://x-lance.github.io/news/announcement_3/ 2024-02-29T00:00:00+00:00 https://x-lance.github.io/news/announcement_4/ 2024-03-14T00:00:00+00:00 https://x-lance.github.io/news/announcement_6/ 2024-04-07T00:00:00+00:00 https://x-lance.github.io/news/announcement_7/ 2024-05-02T00:00:00+00:00 https://x-lance.github.io/news/announcement_8/ 2024-05-02T00:00:00+00:00 https://x-lance.github.io/news/announcement_9/ 2024-05-18T00:00:00+00:00 https://x-lance.github.io/blog/2015/formatting-and-links/ 2015-03-15T16:40:16+00:00 https://x-lance.github.io/blog/2015/images/ 2015-05-15T21:01:00+00:00 https://x-lance.github.io/blog/2015/code/ 2015-07-15T15:09:00+00:00 https://x-lance.github.io/blog/2015/math/ 2015-10-20T15:12:00+00:00 https://x-lance.github.io/blog/2015/disqus-comments/ 2015-10-20T15:59:00+00:00 https://x-lance.github.io/blog/2018/distill/ 2018-12-22T00:00:00+00:00 https://x-lance.github.io/blog/2020/twitter/ 2020-09-28T15:12:00+00:00 https://x-lance.github.io/blog/2020/github-metadata/ 2020-09-28T21:01:00+00:00 https://x-lance.github.io/blog/2021/diagrams/ 2021-07-04T17:39:00+00:00 https://x-lance.github.io/blog/2022/redirect/ 2022-02-01T17:39:00+00:00 https://x-lance.github.io/blog/2022/giscus-comments/ 2022-12-10T15:59:00+00:00 https://x-lance.github.io/blog/2023/table-of-contents/ 2023-03-20T15:59:00+00:00 https://x-lance.github.io/blog/2023/tables/ 2023-03-20T18:37:00+00:00 https://x-lance.github.io/blog/2023/videos/ 2023-04-24T21:01:00+00:00 https://x-lance.github.io/blog/2023/audios/ 2023-04-25T10:25:00+00:00 
https://x-lance.github.io/blog/2023/sidebar-table-of-contents/ 2023-04-25T14:14:00+00:00 https://x-lance.github.io/blog/2023/custom-blockquotes/ 2023-05-12T19:53:00+00:00 https://x-lance.github.io/blog/2023/jupyter-notebook/ 2023-07-04T12:57:00+00:00 https://x-lance.github.io/blog/2023/post-bibliography/ 2023-07-12T13:56:00+00:00 https://x-lance.github.io/blog/2023/tikzjax/ 2023-12-12T22:25:00+00:00 https://x-lance.github.io/blog/2024/chartjs/ 2024-01-26T01:04:00+00:00 https://x-lance.github.io/blog/2024/echarts/ 2024-01-26T16:03:00+00:00 https://x-lance.github.io/blog/2024/geojson-map/ 2024-01-26T17:57:00+00:00 https://x-lance.github.io/blog/2024/vega-lite/ 2024-01-27T00:20:00+00:00 https://x-lance.github.io/blog/2024/advanced-images/ 2024-01-27T11:46:00+00:00 https://x-lance.github.io/blog/2024/code-diff/ 2024-01-27T19:22:00+00:00 https://x-lance.github.io/blog/2022/displaying-external-posts-on-your-al-folio-blog/ 2022-04-23T23:20:09+00:00 https://x-lance.github.io/projects/1_project/ 2024-05-26T02:45:34+00:00 https://x-lance.github.io/projects/2_project/ 2024-05-26T02:45:34+00:00 https://x-lance.github.io/projects/3_project/ 2024-05-26T02:45:34+00:00 https://x-lance.github.io/projects/4_project/ 2024-05-26T02:45:34+00:00 https://x-lance.github.io/projects/5_project/ 2024-05-26T02:45:34+00:00 https://x-lance.github.io/projects/6_project/ 2024-05-26T02:45:34+00:00 https://x-lance.github.io/ https://x-lance.github.io/members/alumni/ https://x-lance.github.io/cv/ https://x-lance.github.io/members/faculty/ https://x-lance.github.io/_pages/zh/members/ https://x-lance.github.io/news/ https://x-lance.github.io/papers/ https://x-lance.github.io/projects/ https://x-lance.github.io/repositories/ https://x-lance.github.io/members/student/ https://x-lance.github.io/teaching/ https://x-lance.github.io/_pages/zh/under_construction/ https://x-lance.github.io/blog/tag/formatting/ https://x-lance.github.io/blog/tag/links/ https://x-lance.github.io/blog/tag/images/ 
https://x-lance.github.io/blog/tag/code/ https://x-lance.github.io/blog/tag/math/ https://x-lance.github.io/blog/tag/comments/ https://x-lance.github.io/blog/tag/distill/ https://x-lance.github.io/blog/tag/metadata/ https://x-lance.github.io/blog/tag/diagrams/ https://x-lance.github.io/blog/tag/toc/ https://x-lance.github.io/blog/tag/tables/ https://x-lance.github.io/blog/tag/videos/ https://x-lance.github.io/blog/tag/audios/ https://x-lance.github.io/blog/tag/sidebar/ https://x-lance.github.io/blog/tag/blockquotes/ https://x-lance.github.io/blog/tag/jupyter/ https://x-lance.github.io/blog/tag/bib/ https://x-lance.github.io/blog/tag/charts/ https://x-lance.github.io/blog/tag/maps/ https://x-lance.github.io/blog/category/sample-posts/ https://x-lance.github.io/blog/category/external-services/ https://x-lance.github.io/blog/2015/ https://x-lance.github.io/blog/2018/ https://x-lance.github.io/blog/2020/ https://x-lance.github.io/blog/2021/ https://x-lance.github.io/blog/2022/ https://x-lance.github.io/blog/2023/ https://x-lance.github.io/blog/2024/ https://x-lance.github.io/blog/ https://x-lance.github.io/blog/page/2/ https://x-lance.github.io/blog/page/3/ https://x-lance.github.io/blog/page/4/ https://x-lance.github.io/blog/page/5/ https://x-lance.github.io/blog/page/6/ \ No newline at end of file + https://x-lance.github.io/news/announcement_1/ 2023-12-31T00:00:00+00:00 https://x-lance.github.io/news/announcement_2/ 2023-12-31T00:00:00+00:00 https://x-lance.github.io/news/announcement_5/ 2024-01-24T00:00:00+00:00 https://x-lance.github.io/news/announcement_3/ 2024-02-29T00:00:00+00:00 https://x-lance.github.io/news/announcement_4/ 2024-03-14T00:00:00+00:00 https://x-lance.github.io/news/announcement_6/ 2024-04-07T00:00:00+00:00 https://x-lance.github.io/news/announcement_7/ 2024-05-02T00:00:00+00:00 https://x-lance.github.io/news/announcement_8/ 2024-05-02T00:00:00+00:00 https://x-lance.github.io/news/announcement_9/ 2024-05-18T00:00:00+00:00 
https://x-lance.github.io/blog/2015/formatting-and-links/ 2015-03-15T16:40:16+00:00 https://x-lance.github.io/blog/2015/images/ 2015-05-15T21:01:00+00:00 https://x-lance.github.io/blog/2015/code/ 2015-07-15T15:09:00+00:00 https://x-lance.github.io/blog/2015/math/ 2015-10-20T15:12:00+00:00 https://x-lance.github.io/blog/2015/disqus-comments/ 2015-10-20T15:59:00+00:00 https://x-lance.github.io/blog/2018/distill/ 2018-12-22T00:00:00+00:00 https://x-lance.github.io/blog/2020/twitter/ 2020-09-28T15:12:00+00:00 https://x-lance.github.io/blog/2020/github-metadata/ 2020-09-28T21:01:00+00:00 https://x-lance.github.io/blog/2021/diagrams/ 2021-07-04T17:39:00+00:00 https://x-lance.github.io/blog/2022/redirect/ 2022-02-01T17:39:00+00:00 https://x-lance.github.io/blog/2022/giscus-comments/ 2022-12-10T15:59:00+00:00 https://x-lance.github.io/blog/2023/table-of-contents/ 2023-03-20T15:59:00+00:00 https://x-lance.github.io/blog/2023/tables/ 2023-03-20T18:37:00+00:00 https://x-lance.github.io/blog/2023/videos/ 2023-04-24T21:01:00+00:00 https://x-lance.github.io/blog/2023/audios/ 2023-04-25T10:25:00+00:00 https://x-lance.github.io/blog/2023/sidebar-table-of-contents/ 2023-04-25T14:14:00+00:00 https://x-lance.github.io/blog/2023/custom-blockquotes/ 2023-05-12T19:53:00+00:00 https://x-lance.github.io/blog/2023/jupyter-notebook/ 2023-07-04T12:57:00+00:00 https://x-lance.github.io/blog/2023/post-bibliography/ 2023-07-12T13:56:00+00:00 https://x-lance.github.io/blog/2023/tikzjax/ 2023-12-12T22:25:00+00:00 https://x-lance.github.io/blog/2024/chartjs/ 2024-01-26T01:04:00+00:00 https://x-lance.github.io/blog/2024/echarts/ 2024-01-26T16:03:00+00:00 https://x-lance.github.io/blog/2024/geojson-map/ 2024-01-26T17:57:00+00:00 https://x-lance.github.io/blog/2024/vega-lite/ 2024-01-27T00:20:00+00:00 https://x-lance.github.io/blog/2024/advanced-images/ 2024-01-27T11:46:00+00:00 https://x-lance.github.io/blog/2024/code-diff/ 2024-01-27T19:22:00+00:00 
https://x-lance.github.io/blog/2022/displaying-external-posts-on-your-al-folio-blog/ 2022-04-23T23:20:09+00:00 https://x-lance.github.io/projects/1_project/ 2024-05-26T02:56:08+00:00 https://x-lance.github.io/projects/2_project/ 2024-05-26T02:56:08+00:00 https://x-lance.github.io/projects/3_project/ 2024-05-26T02:56:08+00:00 https://x-lance.github.io/projects/4_project/ 2024-05-26T02:56:08+00:00 https://x-lance.github.io/projects/5_project/ 2024-05-26T02:56:08+00:00 https://x-lance.github.io/projects/6_project/ 2024-05-26T02:56:08+00:00 https://x-lance.github.io/ https://x-lance.github.io/members/alumni/ https://x-lance.github.io/cv/ https://x-lance.github.io/members/faculty/ https://x-lance.github.io/_pages/zh/members/ https://x-lance.github.io/news/ https://x-lance.github.io/papers/ https://x-lance.github.io/projects/ https://x-lance.github.io/repositories/ https://x-lance.github.io/members/student/ https://x-lance.github.io/teaching/ https://x-lance.github.io/_pages/zh/under_construction/ https://x-lance.github.io/blog/tag/formatting/ https://x-lance.github.io/blog/tag/links/ https://x-lance.github.io/blog/tag/images/ https://x-lance.github.io/blog/tag/code/ https://x-lance.github.io/blog/tag/math/ https://x-lance.github.io/blog/tag/comments/ https://x-lance.github.io/blog/tag/distill/ https://x-lance.github.io/blog/tag/metadata/ https://x-lance.github.io/blog/tag/diagrams/ https://x-lance.github.io/blog/tag/toc/ https://x-lance.github.io/blog/tag/tables/ https://x-lance.github.io/blog/tag/videos/ https://x-lance.github.io/blog/tag/audios/ https://x-lance.github.io/blog/tag/sidebar/ https://x-lance.github.io/blog/tag/blockquotes/ https://x-lance.github.io/blog/tag/jupyter/ https://x-lance.github.io/blog/tag/bib/ https://x-lance.github.io/blog/tag/charts/ https://x-lance.github.io/blog/tag/maps/ https://x-lance.github.io/blog/category/sample-posts/ https://x-lance.github.io/blog/category/external-services/ https://x-lance.github.io/blog/2015/ 
https://x-lance.github.io/blog/2018/ https://x-lance.github.io/blog/2020/ https://x-lance.github.io/blog/2021/ https://x-lance.github.io/blog/2022/ https://x-lance.github.io/blog/2023/ https://x-lance.github.io/blog/2024/ https://x-lance.github.io/blog/ https://x-lance.github.io/blog/page/2/ https://x-lance.github.io/blog/page/3/ https://x-lance.github.io/blog/page/4/ https://x-lance.github.io/blog/page/5/ https://x-lance.github.io/blog/page/6/ \ No newline at end of file diff --git a/zh/teaching/index.html b/zh/teaching/index.html index 6f09e2c15f0d..861be434188a 100644 --- a/zh/teaching/index.html +++ b/zh/teaching/index.html @@ -1 +1 @@ - 课程 | X - LANCE

                                      课程

                                      由X-LANCE开设的课程

                                      2024春

                                      • 智能语音技术 [AI2304 AI2651] 俞凯,钱彦旻

                                      2023秋

                                      • 人工智能前沿讲座 [AI3605] 俞凯
                                      • 自然语言处理 [CS3602 CS4314] 俞凯,陈露,王瑞
                                      • 计算机网络 [ICE4407P] 申丽萍
                                      • 计算机网络(D类) [CS3311] 申丽萍,阮娜
                                      • 离散数学 [CS2501] 申丽萍
                                      • 学术写作、规范与伦理 [GE6001] 吴梦玥

                                      2023春

                                      • 智能语音技术 [AI2304 AI2651] 俞凯,钱彦旻
                                      • 知识表征与推理 [AI3612] 陈露

                                      2022秋

                                      • 人工智能前沿讲座 [AI3605] 俞凯
                                      • 自然语言处理 [CS3602 CS4314] 俞凯,陈露,王瑞
                                      • 离散数学 [CS2501] 申丽萍
                                      • 程序设计思想与方法(C++) [CS1501] 陈谐
                                      • 学术写作、规范与伦理 [GE6001] 吴梦玥

                                      2022春

                                      • 智能语音技术 [AI2304 AI2651] 俞凯,钱彦旻
                                      • 知识表征与推理 [AI3612] 陈露
                                      • 智能感知认知实践 [AI3611] 吴梦玥,陈谐

                                      2021秋

                                      • 人工智能前沿讲座 [AI3605] 俞凯
                                      • 自然语言处理 [CS3602 CS4314] 俞凯,陈露,王瑞
                                      • 计算机网络(D类) [CS3311] 申丽萍,阮娜
                                      • 离散数学 [CS2501] 申丽萍

                                      2021春

                                      • 智能语音技术 [AI2304 AI2651] 俞凯,钱彦旻

                                      2020秋

                                      • 程序设计思想与方法(C++) [CS1501] 申丽萍

                                      未分类或更早

                                      • 计算机组成与体系结构 [ICE4406P] 申丽萍,赵世振
                                      • 计算机伦理学 [CS3309] 吴梦玥
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file + 课程 | X - LANCE

                                      课程

                                      由X-LANCE开设的课程

                                      2024春

                                      • 智能语音技术 [AI2304 AI2651] 俞凯,钱彦旻

                                      2023秋

                                      • 人工智能前沿讲座 [AI3605] 俞凯
                                      • 自然语言处理 [CS3602 CS4314] 俞凯,陈露,王瑞
                                      • 计算机网络 [ICE4407P] 申丽萍
                                      • 计算机网络(D类) [CS3311] 申丽萍,阮娜
                                      • 离散数学 [CS2501] 申丽萍
                                      • 学术写作、规范与伦理 [GE6001] 吴梦玥

                                      2023春

                                      • 智能语音技术 [AI2304 AI2651] 俞凯,钱彦旻
                                      • 知识表征与推理 [AI3612] 陈露

                                      2022秋

                                      • 人工智能前沿讲座 [AI3605] 俞凯
                                      • 自然语言处理 [CS3602 CS4314] 俞凯,陈露,王瑞
                                      • 离散数学 [CS2501] 申丽萍
                                      • 程序设计思想与方法(C++) [CS1501] 陈谐
                                      • 学术写作、规范与伦理 [GE6001] 吴梦玥

                                      2022春

                                      • 智能语音技术 [AI2304 AI2651] 俞凯,钱彦旻
                                      • 知识表征与推理 [AI3612] 陈露
                                      • 智能感知认知实践 [AI3611] 吴梦玥,陈谐

                                      2021秋

                                      • 人工智能前沿讲座 [AI3605] 俞凯
                                      • 自然语言处理 [CS3602 CS4314] 俞凯,陈露,王瑞
                                      • 计算机网络(D类) [CS3311] 申丽萍,阮娜
                                      • 离散数学 [CS2501] 申丽萍

                                      2021春

                                      • 智能语音技术 [AI2304 AI2651] 俞凯,钱彦旻

                                      2020秋

                                      • 程序设计思想与方法(C++) [CS1501] 申丽萍

                                      未分类或更早

                                      • 计算机组成与体系结构 [ICE4406P] 申丽萍,赵世振
                                      • 计算机伦理学 [CS3309] 吴梦玥
                                      © Copyright 2024 X - LANCE. Powered by Jekyll with al-folio theme. Hosted by GitHub Pages. Maintained by ZC Zhu, KY Lan, and JK Yang. Last updated: May 26, 2024.
                                      \ No newline at end of file