BibTeX records: Daniel Povey

download as .bib file

@inproceedings{DBLP:conf/coling/HuangYTLRGIEYPK24,
  author       = {Ruizhe Huang and
                  Mahsa Yarmohammadi and
                  Jan Trmal and
                  Jing Liu and
                  Desh Raj and
                  Leibny Paola Garc{\'{\i}}a and
                  Alexei V. Ivanov and
                  Patrick Ehlen and
                  Mingzhi Yu and
                  Dan Povey and
                  Sanjeev Khudanpur},
  editor       = {Nicoletta Calzolari and
                  Min{-}Yen Kan and
                  V{\'{e}}ronique Hoste and
                  Alessandro Lenci and
                  Sakriani Sakti and
                  Nianwen Xue},
  title        = {{ConEC}: Earnings Call Dataset with Real-world Contexts for Benchmarking
                  Contextual Speech Recognition},
  booktitle    = {Proceedings of the 2024 Joint International Conference on Computational
                  Linguistics, Language Resources and Evaluation, {LREC/COLING} 2024,
                  20-25 May, 2024, Torino, Italy},
  pages        = {3700--3706},
  publisher    = {{ELRA} and {ICCL}},
  year         = {2024},
  url          = {https://aclanthology.org/2024.lrec-main.328},
  timestamp    = {Wed, 12 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/HuangYTLRGIEYPK24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/YangSDM0P024,
  author       = {Yifan Yang and
                  Feiyu Shen and
                  Chenpeng Du and
                  Ziyang Ma and
                  Kai Yu and
                  Daniel Povey and
                  Xie Chen},
  title        = {Towards Universal Speech Discrete Tokens: {A} Case Study for {ASR}
                  and {TTS}},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2024, Seoul, Republic of Korea, April 14-19, 2024},
  pages        = {10401--10405},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/ICASSP48485.2024.10447751},
  doi          = {10.1109/ICASSP48485.2024.10447751},
  timestamp    = {Tue, 06 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/YangSDM0P024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/YangKYYGKLP24,
  author       = {Xiaoyu Yang and
                  Wei Kang and
                  Zengwei Yao and
                  Yifan Yang and
                  Liyong Guo and
                  Fangjun Kuang and
                  Long Lin and
                  Daniel Povey},
  title        = {{PromptASR} for Contextualized {ASR} with Controllable Style},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2024, Seoul, Republic of Korea, April 14-19, 2024},
  pages        = {10536--10540},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/ICASSP48485.2024.10448264},
  doi          = {10.1109/ICASSP48485.2024.10448264},
  timestamp    = {Wed, 14 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/YangKYYGKLP24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KangYYKYGLP24,
  author       = {Wei Kang and
                  Xiaoyu Yang and
                  Zengwei Yao and
                  Fangjun Kuang and
                  Yifan Yang and
                  Liyong Guo and
                  Long Lin and
                  Daniel Povey},
  title        = {Libriheavy: {A} 50,000 Hours {ASR} Corpus with Punctuation Casing
                  and Context},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2024, Seoul, Republic of Korea, April 14-19, 2024},
  pages        = {10991--10995},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/ICASSP48485.2024.10447120},
  doi          = {10.1109/ICASSP48485.2024.10447120},
  timestamp    = {Tue, 13 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KangYYKYGLP24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/Huang0NSHHMPW0P24,
  author       = {Ruizhe Huang and
                  Xiaohui Zhang and
                  Zhaoheng Ni and
                  Li Sun and
                  Moto Hira and
                  Jeff Hwang and
                  Vimal Manohar and
                  Vineel Pratap and
                  Matthew Wiesner and
                  Shinji Watanabe and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {Less Peaky and More Accurate {CTC} Forced Alignment by Label Priors},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2024, Seoul, Republic of Korea, April 14-19, 2024},
  pages        = {11831--11835},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/ICASSP48485.2024.10446111},
  doi          = {10.1109/ICASSP48485.2024.10446111},
  timestamp    = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/Huang0NSHHMPW0P24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/YaoGY0KYJLP24,
  author       = {Zengwei Yao and
                  Liyong Guo and
                  Xiaoyu Yang and
                  Wei Kang and
                  Fangjun Kuang and
                  Yifan Yang and
                  Zengrui Jin and
                  Long Lin and
                  Daniel Povey},
  title        = {Zipformer: {A} faster and better encoder for automatic speech recognition},
  booktitle    = {The Twelfth International Conference on Learning Representations,
                  {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher    = {OpenReview.net},
  year         = {2024},
  url          = {https://openreview.net/forum?id=9WD9KwssyT},
  timestamp    = {Mon, 29 Jul 2024 16:19:40 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/YaoGY0KYJLP24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/odyssey/RajWM0PK24,
  author       = {Desh Raj and
                  Matthew Wiesner and
                  Matthew Maciejewski and
                  Paola Garc{\'{\i}}a and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  editor       = {Najim Dehak and
                  Patrick Cardinal},
  title        = {On Speaker Attribution with {SURT}},
  booktitle    = {Odyssey 2024: The Speaker and Language Recognition Workshop, Quebec
                  City, Canada, June 18-21, 2024},
  pages        = {91--98},
  publisher    = {{ISCA}},
  year         = {2024},
  url          = {https://doi.org/10.21437/odyssey.2024-14},
  doi          = {10.21437/ODYSSEY.2024-14},
  timestamp    = {Wed, 31 Jul 2024 15:08:41 +0200},
  biburl       = {https://dblp.org/rec/conf/odyssey/RajWM0PK24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-15676,
  author       = {Desh Raj and
                  Matthew Wiesner and
                  Matthew Maciejewski and
                  Leibny Paola Garc{\'{\i}}a{-}Perera and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {On Speaker Attribution with {SURT}},
  journal      = {CoRR},
  volume       = {abs/2401.15676},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2401.15676},
  doi          = {10.48550/ARXIV.2401.15676},
  eprinttype   = {arXiv},
  eprint       = {2401.15676},
  timestamp    = {Thu, 08 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2401-15676.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2406-02560,
  author       = {Ruizhe Huang and
                  Xiaohui Zhang and
                  Zhaoheng Ni and
                  Li Sun and
                  Moto Hira and
                  Jeff Hwang and
                  Vimal Manohar and
                  Vineel Pratap and
                  Matthew Wiesner and
                  Shinji Watanabe and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {Less Peaky and More Accurate {CTC} Forced Alignment by Label Priors},
  journal      = {CoRR},
  volume       = {abs/2406.02560},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2406.02560},
  doi          = {10.48550/ARXIV.2406.02560},
  eprinttype   = {arXiv},
  eprint       = {2406.02560},
  timestamp    = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2406-02560.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2406-06571,
  author       = {Quandong Wang and
                  Yuxuan Yuan and
                  Xiaoyu Yang and
                  Ruike Zhang and
                  Kang Zhao and
                  Wei Liu and
                  Jian Luan and
                  Daniel Povey and
                  Bin Wang},
  title        = {{SUBLLM:} {A} Novel Efficient Architecture with Token Sequence Subsampling
                  for {LLM}},
  journal      = {CoRR},
  volume       = {abs/2406.06571},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2406.06571},
  doi          = {10.48550/ARXIV.2406.06571},
  eprinttype   = {arXiv},
  eprint       = {2406.06571},
  timestamp    = {Tue, 13 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2406-06571.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2407-10303,
  author       = {Ruizhe Huang and
                  Mahsa Yarmohammadi and
                  Sanjeev Khudanpur and
                  Daniel Povey},
  title        = {Improving Neural Biasing for Contextual Speech Recognition by Early
                  Context Injection and Text Perturbation},
  journal      = {CoRR},
  volume       = {abs/2407.10303},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2407.10303},
  doi          = {10.48550/ARXIV.2407.10303},
  eprinttype   = {arXiv},
  eprint       = {2407.10303},
  timestamp    = {Sat, 24 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2407-10303.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/ZhuGCPZY23,
  author       = {Han Zhu and
                  Dongji Gao and
                  Gaofeng Cheng and
                  Daniel Povey and
                  Pengyuan Zhang and
                  Yonghong Yan},
  title        = {Alternative Pseudo-Labeling for Semi-Supervised Automatic Speech Recognition},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {31},
  pages        = {3320--3330},
  year         = {2023},
  url          = {https://doi.org/10.1109/TASLP.2023.3306709},
  doi          = {10.1109/TASLP.2023.3306709},
  timestamp    = {Mon, 03 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/ZhuGCPZY23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/RajPK23,
  author       = {Desh Raj and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {{SURT} 2.0: Advances in Transducer-Based Multi-Talker Speech Recognition},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {31},
  pages        = {3800--3813},
  year         = {2023},
  url          = {https://doi.org/10.1109/TASLP.2023.3318398},
  doi          = {10.1109/TASLP.2023.3318398},
  timestamp    = {Thu, 09 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/RajPK23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/GaoXRGPK23,
  author       = {Dongji Gao and
                  Hainan Xu and
                  Desh Raj and
                  Leibny Paola Garc{\'{\i}}a{-}Perera and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {Learning From Flawed Data: Weakly Supervised Automatic Speech Recognition},
  booktitle    = {{IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU}
                  2023, Taipei, Taiwan, December 16-20, 2023},
  pages        = {1--8},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ASRU57964.2023.10389684},
  doi          = {10.1109/ASRU57964.2023.10389684},
  timestamp    = {Tue, 13 Feb 2024 21:21:14 +0100},
  biburl       = {https://dblp.org/rec/conf/asru/GaoXRGPK23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/GuoYWKYCKKLLZP23,
  author       = {Liyong Guo and
                  Xiaoyu Yang and
                  Quandong Wang and
                  Yuxiang Kong and
                  Zengwei Yao and
                  Fan Cui and
                  Fangjun Kuang and
                  Wei Kang and
                  Long Lin and
                  Mingshuang Luo and
                  Piotr Zelasko and
                  Daniel Povey},
  title        = {Predicting Multi-Codebook Vector Quantization Indexes for Knowledge
                  Distillation},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICASSP49357.2023.10095268},
  doi          = {10.1109/ICASSP49357.2023.10095268},
  timestamp    = {Sun, 05 Nov 2023 16:51:21 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/GuoYWKYCKKLLZP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/HuangWGPTK23,
  author       = {Ruizhe Huang and
                  Matthew Wiesner and
                  Leibny Paola Garc{\'{\i}}a{-}Perera and
                  Daniel Povey and
                  Jan Trmal and
                  Sanjeev Khudanpur},
  title        = {Building Keyword Search System from End-To-End {ASR} Systems},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICASSP49357.2023.10097249},
  doi          = {10.1109/ICASSP49357.2023.10097249},
  timestamp    = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/HuangWGPTK23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KangGKLLYYZP23,
  author       = {Wei Kang and
                  Liyong Guo and
                  Fangjun Kuang and
                  Long Lin and
                  Mingshuang Luo and
                  Zengwei Yao and
                  Xiaoyu Yang and
                  Piotr Zelasko and
                  Daniel Povey},
  title        = {Fast and Parallel Decoding for Transducer},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICASSP49357.2023.10094567},
  doi          = {10.1109/ICASSP49357.2023.10094567},
  timestamp    = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/KangGKLLYYZP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KangYKGYLZP23,
  author       = {Wei Kang and
                  Zengwei Yao and
                  Fangjun Kuang and
                  Liyong Guo and
                  Xiaoyu Yang and
                  Long Lin and
                  Piotr Zelasko and
                  Daniel Povey},
  title        = {Delay-Penalized Transducer for Low-Latency Streaming {ASR}},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICASSP49357.2023.10096378},
  doi          = {10.1109/ICASSP49357.2023.10096378},
  timestamp    = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/KangYKGYLZP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/GaoWXGPK23,
  author       = {Dongji Gao and
                  Matthew Wiesner and
                  Hainan Xu and
                  Leibny Paola Garc{\'{\i}}a and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  editor       = {Naomi Harte and
                  Julie Carson{-}Berndsen and
                  Gareth Jones},
  title        = {Bypass Temporal Classification: Weakly Supervised Automatic Speech
                  Recognition with Imperfect Transcripts},
  booktitle    = {24th Annual Conference of the International Speech Communication Association,
                  Interspeech 2023, Dublin, Ireland, August 20-24, 2023},
  pages        = {924--928},
  publisher    = {{ISCA}},
  year         = {2023},
  url          = {https://doi.org/10.21437/Interspeech.2023-2258},
  doi          = {10.21437/INTERSPEECH.2023-2258},
  timestamp    = {Fri, 14 Jun 2024 14:12:12 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/GaoWXGPK23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Yao0KGYYLP23,
  author       = {Zengwei Yao and
                  Wei Kang and
                  Fangjun Kuang and
                  Liyong Guo and
                  Xiaoyu Yang and
                  Yifan Yang and
                  Long Lin and
                  Daniel Povey},
  editor       = {Naomi Harte and
                  Julie Carson{-}Berndsen and
                  Gareth Jones},
  title        = {Delay-penalized {CTC} Implemented Based on Finite State Transducer},
  booktitle    = {24th Annual Conference of the International Speech Communication Association,
                  Interspeech 2023, Dublin, Ireland, August 20-24, 2023},
  pages        = {1329--1333},
  publisher    = {{ISCA}},
  year         = {2023},
  url          = {https://doi.org/10.21437/Interspeech.2023-2508},
  doi          = {10.21437/INTERSPEECH.2023-2508},
  timestamp    = {Fri, 14 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/Yao0KGYYLP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/RajPK23,
  author       = {Desh Raj and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  editor       = {Naomi Harte and
                  Julie Carson{-}Berndsen and
                  Gareth Jones},
  title        = {{GPU}-accelerated Guided Source Separation for Meeting Transcription},
  booktitle    = {24th Annual Conference of the International Speech Communication Association,
                  Interspeech 2023, Dublin, Ireland, August 20-24, 2023},
  pages        = {3507--3511},
  publisher    = {{ISCA}},
  year         = {2023},
  url          = {https://doi.org/10.21437/Interspeech.2023-42},
  doi          = {10.21437/INTERSPEECH.2023-42},
  timestamp    = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/RajPK23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/YangYGY0KL0P23,
  author       = {Yifan Yang and
                  Xiaoyu Yang and
                  Liyong Guo and
                  Zengwei Yao and
                  Wei Kang and
                  Fangjun Kuang and
                  Long Lin and
                  Xie Chen and
                  Daniel Povey},
  editor       = {Naomi Harte and
                  Julie Carson{-}Berndsen and
                  Gareth Jones},
  title        = {Blank-regularized {CTC} for Frame Skipping in Neural Transducer},
  booktitle    = {24th Annual Conference of the International Speech Communication Association,
                  Interspeech 2023, Dublin, Ireland, August 20-24, 2023},
  pages        = {4409--4413},
  publisher    = {{ISCA}},
  year         = {2023},
  url          = {https://doi.org/10.21437/Interspeech.2023-759},
  doi          = {10.21437/INTERSPEECH.2023-759},
  timestamp    = {Fri, 14 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/YangYGY0KL0P23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-11558,
  author       = {Yifan Yang and
                  Xiaoyu Yang and
                  Liyong Guo and
                  Zengwei Yao and
                  Wei Kang and
                  Fangjun Kuang and
                  Long Lin and
                  Xie Chen and
                  Daniel Povey},
  title        = {Blank-regularized {CTC} for Frame Skipping in Neural Transducer},
  journal      = {CoRR},
  volume       = {abs/2305.11558},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.11558},
  doi          = {10.48550/ARXIV.2305.11558},
  eprinttype   = {arXiv},
  eprint       = {2305.11558},
  timestamp    = {Wed, 20 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-11558.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-01031,
  author       = {Dongji Gao and
                  Matthew Wiesner and
                  Hainan Xu and
                  Leibny Paola Garc{\'{\i}}a and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {Bypass Temporal Classification: Weakly Supervised Automatic Speech
                  Recognition with Imperfect Transcripts},
  journal      = {CoRR},
  volume       = {abs/2306.01031},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.01031},
  doi          = {10.48550/ARXIV.2306.01031},
  eprinttype   = {arXiv},
  eprint       = {2306.01031},
  timestamp    = {Sat, 09 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-01031.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-10559,
  author       = {Desh Raj and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {{SURT} 2.0: Advances in Transducer-based Multi-talker Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/2306.10559},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.10559},
  doi          = {10.48550/ARXIV.2306.10559},
  eprinttype   = {arXiv},
  eprint       = {2306.10559},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-10559.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2308-06547,
  author       = {Han Zhu and
                  Dongji Gao and
                  Gaofeng Cheng and
                  Daniel Povey and
                  Pengyuan Zhang and
                  Yonghong Yan},
  title        = {Alternative Pseudo-Labeling for Semi-Supervised Automatic Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/2308.06547},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.06547},
  doi          = {10.48550/ARXIV.2308.06547},
  eprinttype   = {arXiv},
  eprint       = {2308.06547},
  timestamp    = {Mon, 03 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-06547.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-07377,
  author       = {Yifan Yang and
                  Feiyu Shen and
                  Chenpeng Du and
                  Ziyang Ma and
                  Kai Yu and
                  Daniel Povey and
                  Xie Chen},
  title        = {Towards Universal Speech Discrete Tokens: {A} Case Study for {ASR}
                  and {TTS}},
  journal      = {CoRR},
  volume       = {abs/2309.07377},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.07377},
  doi          = {10.48550/ARXIV.2309.07377},
  eprinttype   = {arXiv},
  eprint       = {2309.07377},
  timestamp    = {Wed, 20 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-07377.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-07414,
  author       = {Xiaoyu Yang and
                  Wei Kang and
                  Zengwei Yao and
                  Yifan Yang and
                  Liyong Guo and
                  Fangjun Kuang and
                  Long Lin and
                  Daniel Povey},
  title        = {{PromptASR} for contextualized {ASR} with controllable style},
  journal      = {CoRR},
  volume       = {abs/2309.07414},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.07414},
  doi          = {10.48550/ARXIV.2309.07414},
  eprinttype   = {arXiv},
  eprint       = {2309.07414},
  timestamp    = {Thu, 21 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-07414.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-08105,
  author       = {Wei Kang and
                  Xiaoyu Yang and
                  Zengwei Yao and
                  Fangjun Kuang and
                  Yifan Yang and
                  Liyong Guo and
                  Long Lin and
                  Daniel Povey},
  title        = {Libriheavy: a 50,000 hours {ASR} corpus with punctuation casing and
                  context},
  journal      = {CoRR},
  volume       = {abs/2309.08105},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.08105},
  doi          = {10.48550/ARXIV.2309.08105},
  eprinttype   = {arXiv},
  eprint       = {2309.08105},
  timestamp    = {Tue, 26 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-08105.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-15796,
  author       = {Dongji Gao and
                  Hainan Xu and
                  Desh Raj and
                  Leibny Paola Garc{\'{\i}}a{-}Perera and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {Learning from Flawed Data: Weakly Supervised Automatic Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/2309.15796},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.15796},
  doi          = {10.48550/ARXIV.2309.15796},
  eprinttype   = {arXiv},
  eprint       = {2309.15796},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-15796.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-11230,
  author       = {Zengwei Yao and
                  Liyong Guo and
                  Xiaoyu Yang and
                  Wei Kang and
                  Fangjun Kuang and
                  Yifan Yang and
                  Zengrui Jin and
                  Long Lin and
                  Daniel Povey},
  title        = {Zipformer: {A} faster and better encoder for automatic speech recognition},
  journal      = {CoRR},
  volume       = {abs/2310.11230},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.11230},
  doi          = {10.48550/ARXIV.2310.11230},
  eprinttype   = {arXiv},
  eprint       = {2310.11230},
  timestamp    = {Thu, 26 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-11230.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/KuangGKLLYP22,
  author       = {Fangjun Kuang and
                  Liyong Guo and
                  Wei Kang and
                  Long Lin and
                  Mingshuang Luo and
                  Zengwei Yao and
                  Daniel Povey},
  editor       = {Hanseok Ko and
                  John H. L. Hansen},
  title        = {Pruned {RNN-T} for fast, memory-efficient {ASR} training},
  booktitle    = {23rd Annual Conference of the International Speech Communication Association,
                  Interspeech 2022, Incheon, Korea, September 18-22, 2022},
  pages        = {2068--2072},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-10340},
  doi          = {10.21437/INTERSPEECH.2022-10340},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/KuangGKLLYP22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/cicai/2022-1,
  editor       = {Lu Fang and
                  Daniel Povey and
                  Guangtao Zhai and
                  Tao Mei and
                  Ruiping Wang},
  title        = {Artificial Intelligence - Second {CAAI} International Conference,
                  {CICAI} 2022, Beijing, China, August 27-28, 2022, Revised Selected
                  Papers, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13604},
  publisher    = {Springer},
  year         = {2022},
  url          = {https://doi.org/10.1007/978-3-031-20497-5},
  doi          = {10.1007/978-3-031-20497-5},
  isbn         = {978-3-031-20496-8},
  timestamp    = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cicai/2022-1.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/cicai/2022-2,
  editor       = {Lu Fang and
                  Daniel Povey and
                  Guangtao Zhai and
                  Tao Mei and
                  Ruiping Wang},
  title        = {Artificial Intelligence - Second {CAAI} International Conference,
                  {CICAI} 2022, Beijing, China, August 27-28, 2022, Revised Selected
                  Papers, Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13605},
  publisher    = {Springer},
  year         = {2022},
  url          = {https://doi.org/10.1007/978-3-031-20500-2},
  doi          = {10.1007/978-3-031-20500-2},
  isbn         = {978-3-031-20499-9},
  timestamp    = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cicai/2022-2.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume (editor record): CICAI 2022, Part III, LNCS 13606.
@proceedings{DBLP:conf/cicai/2022-3,
  editor       = {Fang, Lu and
                  Povey, Daniel and
                  Zhai, Guangtao and
                  Mei, Tao and
                  Wang, Ruiping},
  title        = {Artificial Intelligence - Second {CAAI} International Conference,
                  {CICAI} 2022, Beijing, China, August 27-28, 2022, Revised Selected
                  Papers, Part {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13606},
  publisher    = {Springer},
  year         = {2022},
  url          = {https://doi.org/10.1007/978-3-031-20503-3},
  doi          = {10.1007/978-3-031-20503-3},
  isbn         = {978-3-031-20502-6},
  timestamp    = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cicai/2022-3.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2206.13236).
@article{DBLP:journals/corr/abs-2206-13236,
  author       = {Kuang, Fangjun and
                  Guo, Liyong and
                  Kang, Wei and
                  Lin, Long and
                  Luo, Mingshuang and
                  Yao, Zengwei and
                  Povey, Daniel},
  title        = {Pruned {RNN-T} for fast, memory-efficient {ASR} training},
  journal      = {CoRR},
  volume       = {abs/2206.13236},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.13236},
  doi          = {10.48550/ARXIV.2206.13236},
  eprinttype   = {arXiv},
  eprint       = {2206.13236},
  timestamp    = {Fri, 19 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-13236.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2211.00484).
@article{DBLP:journals/corr/abs-2211-00484,
  author       = {Kang, Wei and
                  Guo, Liyong and
                  Kuang, Fangjun and
                  Lin, Long and
                  Luo, Mingshuang and
                  Yao, Zengwei and
                  Yang, Xiaoyu and
                  Zelasko, Piotr and
                  Povey, Daniel},
  title        = {Fast and parallel decoding for transducer},
  journal      = {CoRR},
  volume       = {abs/2211.00484},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.00484},
  doi          = {10.48550/ARXIV.2211.00484},
  eprinttype   = {arXiv},
  eprint       = {2211.00484},
  timestamp    = {Fri, 19 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-00484.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2211.00490).
@article{DBLP:journals/corr/abs-2211-00490,
  author       = {Kang, Wei and
                  Yao, Zengwei and
                  Kuang, Fangjun and
                  Guo, Liyong and
                  Yang, Xiaoyu and
                  Lin, Long and
                  Zelasko, Piotr and
                  Povey, Daniel},
  title        = {Delay-penalized transducer for low-latency streaming {ASR}},
  journal      = {CoRR},
  volume       = {abs/2211.00490},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.00490},
  doi          = {10.48550/ARXIV.2211.00490},
  eprinttype   = {arXiv},
  eprint       = {2211.00490},
  timestamp    = {Fri, 19 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-00490.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2211.00508).
@article{DBLP:journals/corr/abs-2211-00508,
  author       = {Guo, Liyong and
                  Yang, Xiaoyu and
                  Wang, Quandong and
                  Kong, Yuxiang and
                  Yao, Zengwei and
                  Cui, Fan and
                  Kuang, Fangjun and
                  Kang, Wei and
                  Lin, Long and
                  Luo, Mingshuang and
                  Zelasko, Piotr and
                  Povey, Daniel},
  title        = {Predicting Multi-Codebook Vector Quantization Indexes for Knowledge
                  Distillation},
  journal      = {CoRR},
  volume       = {abs/2211.00508},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.00508},
  doi          = {10.48550/ARXIV.2211.00508},
  eprinttype   = {arXiv},
  eprint       = {2211.00508},
  timestamp    = {Fri, 19 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-00508.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2212.05271).
% The acronym GPU is brace-protected so sentence-casing styles do not render it as "Gpu".
@article{DBLP:journals/corr/abs-2212-05271,
  author       = {Raj, Desh and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {{GPU}-accelerated Guided Source Separation for Meeting Transcription},
  journal      = {CoRR},
  volume       = {abs/2212.05271},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.05271},
  doi          = {10.48550/ARXIV.2212.05271},
  eprinttype   = {arXiv},
  eprint       = {2212.05271},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-05271.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE Signal Process. Lett. vol. 28 (2021).
% The acronyms LET and WFST are brace-protected so sentence-casing styles keep their capitals.
@article{DBLP:journals/spl/LvPYLWXK21,
  author       = {Lv, Hang and
                  Povey, Daniel and
                  Yarmohammadi, Mahsa and
                  Li, Ke and
                  Wang, Yiming and
                  Xie, Lei and
                  Khudanpur, Sanjeev},
  title        = {{LET}-Decoder: {A} {WFST}-Based Lazy-Evaluation Token-Group Decoder With
                  Exact Lattice Generation},
  journal      = {{IEEE} Signal Process. Lett.},
  volume       = {28},
  pages        = {703--707},
  year         = {2021},
  url          = {https://doi.org/10.1109/LSP.2021.3067220},
  doi          = {10.1109/LSP.2021.3067220},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/spl/LvPYLWXK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2021 paper. Same title and authors as the arXiv record
% DBLP:journals/corr/abs-2102-04488 in this file; presumably one work, so cite only one.
@inproceedings{DBLP:conf/icassp/Wang0P0K21,
  author       = {Wang, Yiming and
                  Lv, Hang and
                  Povey, Daniel and
                  Xie, Lei and
                  Khudanpur, Sanjeev},
  title        = {Wake Word Detection with Streaming Transformers},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages        = {5864--5868},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICASSP39728.2021.9414777},
  doi          = {10.1109/ICASSP39728.2021.9414777},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/Wang0P0K21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2021 paper. Same authors and (up to capitalisation) title as the arXiv record
% DBLP:journals/corr/abs-2103-09063 in this file; presumably one work, so cite only one.
% The acronym WFST is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/icassp/0001CXP0K21,
  author       = {Lv, Hang and
                  Chen, Zhehuai and
                  Xu, Hainan and
                  Povey, Daniel and
                  Xie, Lei and
                  Khudanpur, Sanjeev},
  title        = {An Asynchronous {WFST}-Based Decoder for Automatic Speech Recognition},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages        = {6019--6023},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICASSP39728.2021.9414509},
  doi          = {10.1109/ICASSP39728.2021.9414509},
  timestamp    = {Fri, 09 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/0001CXP0K21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2021 paper. Same title and authors as the arXiv record
% DBLP:journals/corr/abs-2103-05081 in this file; presumably one work, so cite only one.
@inproceedings{DBLP:conf/icassp/LiPK21,
  author       = {Li, Ke and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {A Parallelizable Lattice Rescoring Strategy with Neural Language Models},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages        = {6518--6522},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICASSP39728.2021.9414714},
  doi          = {10.1109/ICASSP39728.2021.9414714},
  timestamp    = {Tue, 06 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/LiPK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2021 paper. Same title and authors as the arXiv record
% DBLP:journals/corr/abs-2005-10470 in this file; presumably one work, so cite only one.
@inproceedings{DBLP:conf/icassp/HanPTMP21,
  author       = {Han, Kyu Jeong and
                  Pan, Jing and
                  Tadala, Venkata Krishna Naveen and
                  Ma, Tao and
                  Povey, Dan},
  title        = {Multistream {CNN} for Robust Acoustic Modeling},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages        = {6873--6877},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICASSP39728.2021.9414639},
  doi          = {10.1109/ICASSP39728.2021.9414639},
  timestamp    = {Fri, 08 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HanPTMP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2021 paper. Same work (by title) as the arXiv record
% DBLP:journals/corr/abs-2106-06909 in this file; cite only one.
% NOTE(review): the arXiv record additionally lists Yujun Wang and spells
% "Guanbo Wang" without a hyphen - confirm the author list against the paper.
% Title fixes: "10, 000" -> "10,000" (stray space inside the number) and the
% camelCase name GigaSpeech is brace-protected against style recasing.
@inproceedings{DBLP:conf/interspeech/ChenCWDZWSPTZJK21,
  author       = {Chen, Guoguo and
                  Chai, Shuzhou and
                  Wang, Guan{-}Bo and
                  Du, Jiayu and
                  Zhang, Wei{-}Qiang and
                  Weng, Chao and
                  Su, Dan and
                  Povey, Daniel and
                  Trmal, Jan and
                  Zhang, Junbo and
                  Jin, Mingjie and
                  Khudanpur, Sanjeev and
                  Watanabe, Shinji and
                  Zhao, Shuaijiang and
                  Zou, Wei and
                  Li, Xiangang and
                  Yao, Xuchen and
                  Wang, Yongqing and
                  You, Zhao and
                  Yan, Zhiyong},
  editor       = {Hermansky, Hynek and
                  Cernock{\'{y}}, Honza and
                  Burget, Luk{\'{a}}s and
                  Lamel, Lori and
                  Scharenborg, Odette and
                  Motl{\'{\i}}cek, Petr},
  title        = {{GigaSpeech}: An Evolving, Multi-Domain {ASR} Corpus with 10,000 Hours
                  of Transcribed Audio},
  booktitle    = {22nd Annual Conference of the International Speech Communication Association,
                  Interspeech 2021, Brno, Czechia, August 30 - September 3, 2021},
  pages        = {3670--3674},
  publisher    = {{ISCA}},
  year         = {2021},
  url          = {https://doi.org/10.21437/Interspeech.2021-1965},
  doi          = {10.21437/INTERSPEECH.2021-1965},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ChenCWDZWSPTZJK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2021 paper. Same authors and (up to capitalisation) title as the arXiv record
% DBLP:journals/corr/abs-2104-01378 in this file; presumably one work, so cite only one.
% The lowercase corpus name and the proper noun English are brace-protected so
% title-recasing styles leave them as written.
@inproceedings{DBLP:conf/interspeech/ZhangZWYSHLPW21,
  author       = {Zhang, Junbo and
                  Zhang, Zhiwen and
                  Wang, Yongqing and
                  Yan, Zhiyong and
                  Song, Qiong and
                  Huang, Yukai and
                  Li, Ke and
                  Povey, Daniel and
                  Wang, Yujun},
  editor       = {Hermansky, Hynek and
                  Cernock{\'{y}}, Honza and
                  Burget, Luk{\'{a}}s and
                  Lamel, Lori and
                  Scharenborg, Odette and
                  Motl{\'{\i}}cek, Petr},
  title        = {{speechocean762}: An Open-Source Non-Native {English} Speech Corpus for
                  Pronunciation Assessment},
  booktitle    = {22nd Annual Conference of the International Speech Communication Association,
                  Interspeech 2021, Brno, Czechia, August 30 - September 3, 2021},
  pages        = {3710--3714},
  publisher    = {{ISCA}},
  year         = {2021},
  url          = {https://doi.org/10.21437/Interspeech.2021-1259},
  doi          = {10.21437/INTERSPEECH.2021-1259},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ZhangZWYSHLPW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IEEE SLT 2021 paper. Same authors and (up to capitalisation) title as the arXiv record
% DBLP:journals/corr/abs-2011-01997 in this file; presumably one work, so cite only one.
% The method name DOVER-Lap is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/slt/RajGH0PSK21,
  author       = {Raj, Desh and
                  Garc{\'{\i}}a{-}Perera, Leibny Paola and
                  Huang, Zili and
                  Watanabe, Shinji and
                  Povey, Daniel and
                  Stolcke, Andreas and
                  Khudanpur, Sanjeev},
  title        = {{DOVER-Lap}: {A} Method for Combining Overlap-Aware Diarization Outputs},
  booktitle    = {{IEEE} Spoken Language Technology Workshop, {SLT} 2021, Shenzhen,
                  China, January 19-22, 2021},
  pages        = {881--888},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/SLT48900.2021.9383490},
  doi          = {10.1109/SLT48900.2021.9383490},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/slt/RajGH0PSK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2102.04488). Same title and authors as
% DBLP:conf/icassp/Wang0P0K21 in this file; presumably one work, so cite only one.
@article{DBLP:journals/corr/abs-2102-04488,
  author       = {Wang, Yiming and
                  Lv, Hang and
                  Povey, Daniel and
                  Xie, Lei and
                  Khudanpur, Sanjeev},
  title        = {Wake Word Detection with Streaming Transformers},
  journal      = {CoRR},
  volume       = {abs/2102.04488},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.04488},
  eprinttype   = {arXiv},
  eprint       = {2102.04488},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-04488.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2103.05081). Same title and authors as
% DBLP:conf/icassp/LiPK21 in this file; presumably one work, so cite only one.
@article{DBLP:journals/corr/abs-2103-05081,
  author       = {Li, Ke and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {A Parallelizable Lattice Rescoring Strategy with Neural Language Models},
  journal      = {CoRR},
  volume       = {abs/2103.05081},
  year         = {2021},
  url          = {https://arxiv.org/abs/2103.05081},
  eprinttype   = {arXiv},
  eprint       = {2103.05081},
  timestamp    = {Tue, 06 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2103-05081.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2103.09063). Same authors and (up to capitalisation)
% title as DBLP:conf/icassp/0001CXP0K21 in this file; presumably one work, so cite only one.
% The acronym WFST is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2103-09063,
  author       = {Lv, Hang and
                  Chen, Zhehuai and
                  Xu, Hainan and
                  Povey, Daniel and
                  Xie, Lei and
                  Khudanpur, Sanjeev},
  title        = {An Asynchronous {WFST}-Based Decoder For Automatic Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/2103.09063},
  year         = {2021},
  url          = {https://arxiv.org/abs/2103.09063},
  eprinttype   = {arXiv},
  eprint       = {2103.09063},
  timestamp    = {Tue, 23 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2103-09063.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2104.01378). Same authors and (up to capitalisation)
% title as DBLP:conf/interspeech/ZhangZWYSHLPW21 in this file; presumably one work, so cite only one.
% The lowercase corpus name and the proper noun English are brace-protected so
% title-recasing styles leave them as written.
@article{DBLP:journals/corr/abs-2104-01378,
  author       = {Zhang, Junbo and
                  Zhang, Zhiwen and
                  Wang, Yongqing and
                  Yan, Zhiyong and
                  Song, Qiong and
                  Huang, Yukai and
                  Li, Ke and
                  Povey, Daniel and
                  Wang, Yujun},
  title        = {{speechocean762}: An Open-Source Non-native {English} Speech Corpus For
                  Pronunciation Assessment},
  journal      = {CoRR},
  volume       = {abs/2104.01378},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.01378},
  eprinttype   = {arXiv},
  eprint       = {2104.01378},
  timestamp    = {Tue, 06 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-01378.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2106.06909). Same work (by title) as
% DBLP:conf/interspeech/ChenCWDZWSPTZJK21 in this file; cite only one.
% NOTE(review): this record lists Yujun Wang and spells "Guanbo Wang" without a
% hyphen, unlike the Interspeech record - confirm the author list against the paper.
% Title fixes: "10, 000" -> "10,000" (stray space inside the number) and the
% camelCase name GigaSpeech is brace-protected against style recasing.
@article{DBLP:journals/corr/abs-2106-06909,
  author       = {Chen, Guoguo and
                  Chai, Shuzhou and
                  Wang, Guanbo and
                  Du, Jiayu and
                  Zhang, Wei{-}Qiang and
                  Weng, Chao and
                  Su, Dan and
                  Povey, Daniel and
                  Trmal, Jan and
                  Zhang, Junbo and
                  Jin, Mingjie and
                  Khudanpur, Sanjeev and
                  Watanabe, Shinji and
                  Zhao, Shuaijiang and
                  Zou, Wei and
                  Li, Xiangang and
                  Yao, Xuchen and
                  Wang, Yongqing and
                  Wang, Yujun and
                  You, Zhao and
                  Yan, Zhiyong},
  title        = {{GigaSpeech}: An Evolving, Multi-domain {ASR} Corpus with 10,000 Hours
                  of Transcribed Audio},
  journal      = {CoRR},
  volume       = {abs/2106.06909},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.06909},
  eprinttype   = {arXiv},
  eprint       = {2106.06909},
  timestamp    = {Tue, 19 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-06909.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2110.12561).
% The nickname in the third author's name used straight double quotes, which TeX
% typesets as two closing quotes and which some babel languages treat as an active
% shorthand; it now uses TeX quote ligatures inside a brace group. The comma form
% keeps Trmal unambiguously as the surname.
@article{DBLP:journals/corr/abs-2110-12561,
  author       = {Zelasko, Piotr and
                  Povey, Daniel and
                  Trmal, Jan {``Yenda''} and
                  Khudanpur, Sanjeev},
  title        = {Lhotse: a speech data representation library for the modern deep learning
                  ecosystem},
  journal      = {CoRR},
  volume       = {abs/2110.12561},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.12561},
  eprinttype   = {arXiv},
  eprint       = {2110.12561},
  timestamp    = {Thu, 28 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-12561.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 paper.
@inproceedings{DBLP:conf/icassp/ZhangPK20,
  author       = {Zhang, Xiaohui and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {{OOV} Recovery with Efficient 2nd Pass Decoding and Open-vocabulary
                  Word-level {RNNLM} Rescoring for Hybrid {ASR}},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {6334--6338},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9053872},
  doi          = {10.1109/ICASSP40776.2020.9053872},
  timestamp    = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ZhangPK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 paper. Same title and authors as the arXiv record
% DBLP:journals/corr/abs-2002-06220 in this file; presumably one work, so cite only one.
@inproceedings{DBLP:conf/icassp/HuangWFGSPK20,
  author       = {Huang, Zili and
                  Watanabe, Shinji and
                  Fujita, Yusuke and
                  Garc{\'{\i}}a, Paola and
                  Shao, Yiwen and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Speaker Diarization with Region Proposal Network},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {6514--6518},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9053760},
  doi          = {10.1109/ICASSP40776.2020.9053760},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HuangWFGSPK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 paper.
% Title fix: the acronym was stored as "Gpu"; it is now {GPU}, and the proper noun
% Viterbi is brace-protected so sentence-casing styles keep both capitalised.
@inproceedings{DBLP:conf/icassp/BraunLLKP20,
  author       = {Braun, Hugo and
                  Luitjens, Justin and
                  Leary, Ryan and
                  Kaldewey, Tim and
                  Povey, Daniel},
  title        = {{GPU}-Accelerated {Viterbi} Exact Lattice Decoder for Batched Online and
                  Offline Speech Recognition},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {7874--7878},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9054099},
  doi          = {10.1109/ICASSP40776.2020.9054099},
  timestamp    = {Thu, 23 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BraunLLKP20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 paper.
@inproceedings{DBLP:conf/icassp/LiLHHPPK20,
  author       = {Li, Ke and
                  Liu, Zhe and
                  He, Tianxing and
                  Huang, Hongzhao and
                  Peng, Fuchun and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {An Empirical Study of Transformer-Based Neural Language Model Adaptation},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {7934--7938},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9053399},
  doi          = {10.1109/ICASSP40776.2020.9053399},
  timestamp    = {Tue, 06 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/LiLHHPPK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper. Same title and authors as the arXiv record
% DBLP:journals/corr/abs-2005-09824 in this file; presumably one work, so cite only one.
% The camelCase names PyChain and PyTorch are brace-protected so sentence-casing
% styles do not flatten them to "Pychain" / "pytorch".
@inproceedings{DBLP:conf/interspeech/ShaoWPK20,
  author       = {Shao, Yiwen and
                  Wang, Yiming and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {{PyChain}: {A} Fully Parallelized {PyTorch} Implementation of {LF-MMI}
                  for End-to-End {ASR}},
  booktitle    = {21st Annual Conference of the International Speech Communication Association,
                  Interspeech 2020, Virtual Event, Shanghai, China, October 25-29, 2020},
  pages        = {561--565},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-3053},
  doi          = {10.21437/INTERSPEECH.2020-3053},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ShaoWPK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper.
% The acronym MFCCs is brace-protected so sentence-casing styles do not render it as "mfccs".
@inproceedings{DBLP:conf/interspeech/GhahramaniHPHK20,
  author       = {Ghahramani, Pegah and
                  Hadian, Hossein and
                  Povey, Daniel and
                  Hermansky, Hynek and
                  Khudanpur, Sanjeev},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {An Alternative to {MFCCs} for {ASR}},
  booktitle    = {21st Annual Conference of the International Speech Communication Association,
                  Interspeech 2020, Virtual Event, Shanghai, China, October 25-29, 2020},
  pages        = {1664--1667},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-2690},
  doi          = {10.21437/INTERSPEECH.2020-2690},
  timestamp    = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/GhahramaniHPHK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper.
@inproceedings{DBLP:conf/interspeech/LiPK20,
  author       = {Li, Ke and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {Neural Language Modeling with Implicit Cache Pointers},
  booktitle    = {21st Annual Conference of the International Speech Communication Association,
                  Interspeech 2020, Virtual Event, Shanghai, China, October 25-29, 2020},
  pages        = {3625--3629},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-3020},
  doi          = {10.21437/INTERSPEECH.2020-3020},
  timestamp    = {Tue, 06 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/LiPK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper. Same title and authors as the arXiv record
% DBLP:journals/corr/abs-2005-08347 in this file; presumably one work, so cite only one.
@inproceedings{DBLP:conf/interspeech/Wang0P0K20,
  author       = {Wang, Yiming and
                  Lv, Hang and
                  Povey, Daniel and
                  Xie, Lei and
                  Khudanpur, Sanjeev},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {Wake Word Detection with Alignment-Free Lattice-Free {MMI}},
  booktitle    = {21st Annual Conference of the International Speech Communication Association,
                  Interspeech 2020, Virtual Event, Shanghai, China, October 25-29, 2020},
  pages        = {4258--4262},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-1811},
  doi          = {10.21437/INTERSPEECH.2020-1811},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/Wang0P0K20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper.
@inproceedings{DBLP:conf/interspeech/MadikeriKTMBP20,
  author       = {Madikeri, Srikanth R. and
                  Khonglah, Banriskhem K. and
                  Tong, Sibo and
                  Motl{\'{\i}}cek, Petr and
                  Bourlard, Herv{\'{e}} and
                  Povey, Daniel},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {Lattice-Free Maximum Mutual Information Training of Multilingual Speech
                  Recognition Systems},
  booktitle    = {21st Annual Conference of the International Speech Communication Association,
                  Interspeech 2020, Virtual Event, Shanghai, China, October 25-29, 2020},
  pages        = {4746--4750},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-2919},
  doi          = {10.21437/INTERSPEECH.2020-2919},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/MadikeriKTMBP20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper. Same authors and (up to capitalisation) title as the arXiv record
% DBLP:journals/corr/abs-2008-02385 in this file; presumably one work, so cite only one.
@inproceedings{DBLP:conf/interspeech/HuangLAPK20,
  author       = {Huang, Ruizhe and
                  Li, Ke and
                  Arora, Ashish and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {Efficient {MDI} Adaptation for n-Gram Language Models},
  booktitle    = {21st Annual Conference of the International Speech Communication Association,
                  Interspeech 2020, Virtual Event, Shanghai, China, October 25-29, 2020},
  pages        = {4916--4920},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-2909},
  doi          = {10.21437/INTERSPEECH.2020-2909},
  timestamp    = {Tue, 06 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/HuangLAPK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2002.06220). Same title and authors as
% DBLP:conf/icassp/HuangWFGSPK20 in this file; presumably one work, so cite only one.
@article{DBLP:journals/corr/abs-2002-06220,
  author       = {Huang, Zili and
                  Watanabe, Shinji and
                  Fujita, Yusuke and
                  Garc{\'{\i}}a, Paola and
                  Shao, Yiwen and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Speaker Diarization with Region Proposal Network},
  journal      = {CoRR},
  volume       = {abs/2002.06220},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.06220},
  eprinttype   = {arXiv},
  eprint       = {2002.06220},
  timestamp    = {Thu, 07 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-06220.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2005.08347). Same title and authors as
% DBLP:conf/interspeech/Wang0P0K20 in this file; presumably one work, so cite only one.
@article{DBLP:journals/corr/abs-2005-08347,
  author       = {Wang, Yiming and
                  Lv, Hang and
                  Povey, Daniel and
                  Xie, Lei and
                  Khudanpur, Sanjeev},
  title        = {Wake Word Detection with Alignment-Free Lattice-Free {MMI}},
  journal      = {CoRR},
  volume       = {abs/2005.08347},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.08347},
  eprinttype   = {arXiv},
  eprint       = {2005.08347},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-08347.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2005.09824). Same title and authors as
% DBLP:conf/interspeech/ShaoWPK20 in this file; presumably one work, so cite only one.
% The camelCase names PyChain and PyTorch are brace-protected so sentence-casing
% styles do not flatten them to "Pychain" / "pytorch".
@article{DBLP:journals/corr/abs-2005-09824,
  author       = {Shao, Yiwen and
                  Wang, Yiming and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {{PyChain}: {A} Fully Parallelized {PyTorch} Implementation of {LF-MMI}
                  for End-to-End {ASR}},
  journal      = {CoRR},
  volume       = {abs/2005.09824},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.09824},
  eprinttype   = {arXiv},
  eprint       = {2005.09824},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-09824.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2005.10470). Same title and authors as
% DBLP:conf/icassp/HanPTMP21 in this file; presumably one work, so cite only one.
@article{DBLP:journals/corr/abs-2005-10470,
  author       = {Han, Kyu Jeong and
                  Pan, Jing and
                  Tadala, Venkata Krishna Naveen and
                  Ma, Tao and
                  Povey, Dan},
  title        = {Multistream {CNN} for Robust Acoustic Modeling},
  journal      = {CoRR},
  volume       = {abs/2005.10470},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.10470},
  eprinttype   = {arXiv},
  eprint       = {2005.10470},
  timestamp    = {Fri, 08 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-10470.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2008.02385). Same authors and (up to capitalisation)
% title as DBLP:conf/interspeech/HuangLAPK20 in this file; presumably one work, so cite only one.
@article{DBLP:journals/corr/abs-2008-02385,
  author       = {Huang, Ruizhe and
                  Li, Ke and
                  Arora, Ashish and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Efficient {MDI} Adaptation for n-gram Language Models},
  journal      = {CoRR},
  volume       = {abs/2008.02385},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.02385},
  eprinttype   = {arXiv},
  eprint       = {2008.02385},
  timestamp    = {Tue, 06 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-02385.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint record (CoRR abs/2011.01997). Same authors and (up to capitalisation)
% title as DBLP:conf/slt/RajGH0PSK21 in this file; presumably one work, so cite only one.
% The method name DOVER-Lap is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2011-01997,
  author       = {Raj, Desh and
                  Garc{\'{\i}}a{-}Perera, Leibny Paola and
                  Huang, Zili and
                  Watanabe, Shinji and
                  Povey, Daniel and
                  Stolcke, Andreas and
                  Khudanpur, Sanjeev},
  title        = {{DOVER-Lap}: {A} Method for Combining Overlap-aware Diarization Outputs},
  journal      = {CoRR},
  volume       = {abs/2011.01997},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.01997},
  eprinttype   = {arXiv},
  eprint       = {2011.01997},
  timestamp    = {Wed, 29 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-01997.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2011-02090,
  author       = {Raj, Desh and
                  Villalba, Jes{\'{u}}s and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Frustratingly Easy Noise-aware Training of Acoustic Models},
  journal      = {CoRR},
  volume       = {abs/2011.02090},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.02090},
  eprinttype   = {arXiv},
  eprint       = {2011.02090},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-02090.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/ChenYXLXPK19,
  author       = {Chen, Zhehuai and
                  Yarmohammadi, Mahsa and
                  Xu, Hainan and
                  Lv, Hang and
                  Xie, Lei and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Incremental Lattice Determinization for {WFST} Decoders},
  booktitle    = {{IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU}
                  2019, Singapore, December 14-18, 2019},
  pages        = {1--7},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ASRU46091.2019.9004006},
  doi          = {10.1109/ASRU46091.2019.9004006},
  timestamp    = {Mon, 24 Feb 2020 17:51:31 +0100},
  biburl       = {https://dblp.org/rec/conf/asru/ChenYXLXPK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/RajSPK19,
  author       = {Raj, Desh and
                  Snyder, David and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Probing the Information Encoded in X-Vectors},
  booktitle    = {{IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU}
                  2019, Singapore, December 14-18, 2019},
  pages        = {726--733},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ASRU46091.2019.9003979},
  doi          = {10.1109/ASRU46091.2019.9003979},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/asru/RajSPK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SnyderGSMPK19,
  author       = {Snyder, David and
                  Garcia{-}Romero, Daniel and
                  Sell, Gregory and
                  McCree, Alan and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Speaker Recognition for Multi-speaker Conversations Using X-vectors},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages        = {5796--5800},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICASSP.2019.8683760},
  doi          = {10.1109/ICASSP.2019.8683760},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SnyderGSMPK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdar/ChangAGEPK19,
  author       = {Chang, Chun{-}Chieh and
                  Arora, Ashish and
                  Garc{\'{\i}}a{-}Perera, Leibny Paola and
                  Etter, David and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Optical Character Recognition with {Chinese} and {Korean} Character Decomposition},
  booktitle    = {Second International Workshop on Machine Learning, WML@ICDAR 2019,
                  Sydney, Australia, September 22-25, 2019},
  pages        = {134--139},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICDARW.2019.40094},
  doi          = {10.1109/ICDARW.2019.40094},
  timestamp    = {Wed, 13 Nov 2019 17:12:21 +0100},
  biburl       = {https://dblp.org/rec/conf/icdar/ChangAGEPK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdar/AroraGWMSKCRBPE19,
  author       = {Arora, Ashish and
                  Garc{\'{\i}}a, Paola and
                  Watanabe, Shinji and
                  Manohar, Vimal and
                  Shao, Yiwen and
                  Khudanpur, Sanjeev and
                  Chang, Chun{-}Chieh and
                  Rekabdar, Babak and
                  BabaAli, Bagher and
                  Povey, Daniel and
                  Etter, David and
                  Raj, Desh and
                  Hadian, Hossein and
                  Trmal, Jan},
  title        = {Using {ASR} Methods for {OCR}},
  booktitle    = {2019 International Conference on Document Analysis and Recognition,
                  {ICDAR} 2019, Sydney, Australia, September 20-25, 2019},
  pages        = {663--668},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICDAR.2019.00111},
  doi          = {10.1109/ICDAR.2019.00111},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icdar/AroraGWMSKCRBPE19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/WuGPK19,
  author       = {Wu, Fei and
                  Garc{\'{\i}}a{-}Perera, Leibny Paola and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {Advances in Automatic Speech Recognition for Child Speech Using Factored
                  Time Delay Neural Network},
  booktitle    = {20th Annual Conference of the International Speech Communication Association,
                  Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages        = {1--5},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2980},
  doi          = {10.21437/INTERSPEECH.2019-2980},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/WuGPK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/XieGPK19,
  author       = {Xie, Jiamin and
                  Garc{\'{\i}}a{-}Perera, Leibny Paola and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {Multi-{PLDA} Diarization on Children's Speech},
  booktitle    = {20th Annual Conference of the International Speech Communication Association,
                  Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages        = {376--380},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2961},
  doi          = {10.21437/INTERSPEECH.2019-2961},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/XieGPK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/VillalbaCSGMSBR19,
  author       = {Villalba, Jes{\'{u}}s and
                  Chen, Nanxin and
                  Snyder, David and
                  Garcia{-}Romero, Daniel and
                  McCree, Alan and
                  Sell, Gregory and
                  Borgstrom, Jonas and
                  Richardson, Fred and
                  Shon, Suwon and
                  Grondin, Fran{\c{c}}ois and
                  Dehak, R{\'{e}}da and
                  Garc{\'{\i}}a{-}Perera, Leibny Paola and
                  Povey, Daniel and
                  Torres{-}Carrasquillo, Pedro A. and
                  Khudanpur, Sanjeev and
                  Dehak, Najim},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {State-of-the-Art Speaker Recognition for Telephone and Video Speech:
                  The {JHU-MIT} Submission for {NIST} {SRE18}},
  booktitle    = {20th Annual Conference of the International Speech Communication Association,
                  Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages        = {1488--1492},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2713},
  doi          = {10.21437/INTERSPEECH.2019-2713},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/VillalbaCSGMSBR19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Garcia-RomeroSS19,
  author       = {Garcia{-}Romero, Daniel and
                  Snyder, David and
                  Sell, Gregory and
                  McCree, Alan and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {x-Vector {DNN} Refinement with Full-Length Recordings for Speaker
                  Recognition},
  booktitle    = {20th Annual Conference of the International Speech Communication Association,
                  Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages        = {1493--1496},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2205},
  doi          = {10.21437/INTERSPEECH.2019-2205},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/Garcia-RomeroSS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Garcia-RomeroSW19,
  author       = {Garcia{-}Romero, Daniel and
                  Snyder, David and
                  Watanabe, Shinji and
                  Sell, Gregory and
                  McCree, Alan and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {Speaker Recognition Benchmark Using the {CHiME-5} Corpus},
  booktitle    = {20th Annual Conference of the International Speech Communication Association,
                  Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages        = {1506--1510},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2174},
  doi          = {10.21437/INTERSPEECH.2019-2174},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/Garcia-RomeroSW19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SnyderVCPSDK19,
  author       = {Snyder, David and
                  Villalba, Jes{\'{u}}s and
                  Chen, Nanxin and
                  Povey, Daniel and
                  Sell, Gregory and
                  Dehak, Najim and
                  Khudanpur, Sanjeev},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {The {JHU} Speaker Recognition System for the {VOiCES} 2019 Challenge},
  booktitle    = {20th Annual Conference of the International Speech Communication Association,
                  Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages        = {2468--2472},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2979},
  doi          = {10.21437/INTERSPEECH.2019-2979},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SnyderVCPSDK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/WangSXMNPK19,
  author       = {Wang, Yiming and
                  Snyder, David and
                  Xu, Hainan and
                  Manohar, Vimal and
                  Nidadavolu, Phani Sankar and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {The {JHU} {ASR} System for {VOiCES} from a Distance Challenge 2019},
  booktitle    = {20th Annual Conference of the International Speech Communication Association,
                  Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages        = {2488--2492},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-1948},
  doi          = {10.21437/INTERSPEECH.2019-1948},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/WangSXMNPK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SarmaGPGSD19,
  author       = {Sarma, Mousmita and
                  Ghahremani, Pegah and
                  Povey, Daniel and
                  Goel, Nagendra Kumar and
                  Sarma, Kandarpa Kumar and
                  Dehak, Najim},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {Improving Emotion Identification Using Phone Posteriors in Raw Speech
                  Waveform Based {DNN}},
  booktitle    = {20th Annual Conference of the International Speech Communication Association,
                  Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages        = {3925--3929},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2093},
  doi          = {10.21437/INTERSPEECH.2019-2093},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SarmaGPGSD19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mtsummit/YarmohammadiMHR19,
  author       = {Yarmohammadi, Mahsa and
                  Ma, Xutai and
                  Hisamoto, Sorami and
                  Rahman, Muhammad and
                  Wang, Yiming and
                  Xu, Hainan and
                  Povey, Daniel and
                  Koehn, Philipp and
                  Duh, Kevin},
  editor       = {Forcada, Mikel L. and
                  Way, Andy and
                  Haddow, Barry and
                  Sennrich, Rico},
  title        = {Robust Document Representations for Cross-Lingual Information Retrieval
                  in Low-Resource Settings},
  booktitle    = {Proceedings of Machine Translation Summit {XVII} Volume 1: Research
                  Track, MTSummit 2019, Dublin, Ireland, August 19-23, 2019},
  pages        = {12--20},
  publisher    = {European Association for Machine Translation},
  year         = {2019},
  url          = {https://aclanthology.org/W19-6602/},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mtsummit/YarmohammadiMHR19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-06351,
  author       = {Raj, Desh and
                  Snyder, David and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Probing the Information Encoded in x-vectors},
  journal      = {CoRR},
  volume       = {abs/1909.06351},
  year         = {2019},
  url          = {https://arxiv.org/abs/1909.06351},
  eprinttype   = {arXiv},
  eprint       = {1909.06351},
  timestamp    = {Wed, 18 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-06351.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/spl/PeddintiWPK18,
  author       = {Peddinti, Vijayaditya and
                  Wang, Yiming and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Low Latency Acoustic Modeling Using Temporal Convolution and {LSTMs}},
  journal      = {{IEEE} Signal Process. Lett.},
  volume       = {25},
  number       = {3},
  pages        = {373--377},
  year         = {2018},
  url          = {https://doi.org/10.1109/LSP.2017.2723507},
  doi          = {10.1109/LSP.2017.2723507},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/spl/PeddintiWPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/HadianSPK18,
  author       = {Hadian, Hossein and
                  Sameti, Hossein and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Flat-Start Single-Stage Discriminatively Trained {HMM}-Based Models
                  for {ASR}},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {26},
  number       = {11},
  pages        = {1949--1961},
  year         = {2018},
  url          = {https://doi.org/10.1109/TASLP.2018.2848701},
  doi          = {10.1109/TASLP.2018.2848701},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/HadianSPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iberspeech/HuangGVPD18,
  author       = {Huang, Zili and
                  Garc{\'{\i}}a{-}Perera, L. Paola and
                  Villalba, Jes{\'{u}}s and
                  Povey, Daniel and
                  Dehak, Najim},
  editor       = {Luque, Jordi and
                  Bonafonte, Antonio and
                  Al{\'{\i}}as Pujol, Francesc and
                  Teixeira, Ant{\'{o}}nio J. S.},
  title        = {{JHU} Diarization System Description},
  booktitle    = {Fourth International Conference, IberSPEECH 2018, Barcelona, Spain,
                  21-23 November 2018, Proceedings},
  pages        = {236--239},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/IberSPEECH.2018-49},
  doi          = {10.21437/IBERSPEECH.2018-49},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iberspeech/HuangGVPD18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ManoharHPK18,
  author       = {Manohar, Vimal and
                  Hadian, Hossein and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Semi-Supervised Training of Acoustic Models Using Lattice-Free {MMI}},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {4844--4848},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8462331},
  doi          = {10.1109/ICASSP.2018.8462331},
  timestamp    = {Mon, 15 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ManoharHPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SnyderGSPK18,
  author       = {Snyder, David and
                  Garcia{-}Romero, Daniel and
                  Sell, Gregory and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {X-Vectors: Robust {DNN} Embeddings for Speaker Recognition},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {5329--5333},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8461375},
  doi          = {10.1109/ICASSP.2018.8461375},
  timestamp    = {Tue, 18 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SnyderGSPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyHGLK18,
  author       = {Povey, Daniel and
                  Hadian, Hossein and
                  Ghahremani, Pegah and
                  Li, Ke and
                  Khudanpur, Sanjeev},
  title        = {A Time-Restricted Self-Attention Layer for {ASR}},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {5874--5878},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8462497},
  doi          = {10.1109/ICASSP.2018.8462497},
  timestamp    = {Tue, 06 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyHGLK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/XuCGWLGCPK18,
  author       = {Xu, Hainan and
                  Chen, Tongfei and
                  Gao, Dongji and
                  Wang, Yiming and
                  Li, Ke and
                  Goel, Nagendra and
                  Carmiel, Yishay and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {A Pruned {RNNLM} Lattice-Rescoring Algorithm for Automatic Speech Recognition},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {5929--5933},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8461974},
  doi          = {10.1109/ICASSP.2018.8461974},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/XuCGWLGCPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/XuLWWKCPK18,
  author       = {Xu, Hainan and
                  Li, Ke and
                  Wang, Yiming and
                  Wang, Jian and
                  Kang, Shiyin and
                  Chen, Xie and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  title        = {Neural Network Language Modeling with Letter-Based Features and Importance
                  Sampling},
  booktitle    = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages        = {6109--6113},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICASSP.2018.8461704},
  doi          = {10.1109/ICASSP.2018.8461704},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/XuLWWKCPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/HadianSPK18,
  author       = {Hadian, Hossein and
                  Sameti, Hossein and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Yegnanarayana, B.},
  title        = {End-to-end Speech Recognition Using Lattice-free {MMI}},
  booktitle    = {19th Annual Conference of the International Speech Communication Association,
                  Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages        = {12--16},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1423},
  doi          = {10.21437/INTERSPEECH.2018-1423},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HadianSPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/GhahremaniNCVPK18,
  author       = {Ghahremani, Pegah and
                  Nidadavolu, Phani Sankar and
                  Chen, Nanxin and
                  Villalba, Jes{\'{u}}s and
                  Povey, Daniel and
                  Khudanpur, Sanjeev and
                  Dehak, Najim},
  editor       = {Yegnanarayana, B.},
  title        = {End-to-end Deep Neural Network Age Estimation},
  booktitle    = {19th Annual Conference of the International Speech Communication Association,
                  Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages        = {277--281},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-2015},
  doi          = {10.21437/INTERSPEECH.2018-2015},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/GhahremaniNCVPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/GhahremaniHLPK18,
  author       = {Ghahremani, Pegah and
                  Hadian, Hossein and
                  Lv, Hang and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Yegnanarayana, B.},
  title        = {Acoustic Modeling from Frequency Domain Representations of Speech},
  booktitle    = {19th Annual Conference of the International Speech Communication Association,
                  Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages        = {1596--1600},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1453},
  doi          = {10.21437/INTERSPEECH.2018-1453},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/GhahremaniHLPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ChengPHXK018,
  author       = {Cheng, Gaofeng and
                  Povey, Daniel and
                  Huang, Lu and
                  Xu, Ji and
                  Khudanpur, Sanjeev and
                  Yan, Yonghong},
  editor       = {Yegnanarayana, B.},
  title        = {Output-Gate Projected Gated Recurrent Unit for Speech Recognition},
  booktitle    = {19th Annual Conference of the International Speech Communication Association,
                  Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages        = {1793--1797},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1403},
  doi          = {10.21437/INTERSPEECH.2018-1403},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/ChengPHXK018.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ChenLXWPK18,
  author       = {Chen, Zhehuai and
                  Luitjens, Justin and
                  Xu, Hainan and
                  Wang, Yiming and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Yegnanarayana, B.},
  title        = {A {GPU}-based {WFST} Decoder with Exact Lattice Generation},
  booktitle    = {19th Annual Conference of the International Speech Communication Association,
                  Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages        = {2212--2216},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1339},
  doi          = {10.21437/INTERSPEECH.2018-1339},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ChenLXWPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SellSMGVMMDPWK18,
  author       = {Sell, Gregory and
                  Snyder, David and
                  McCree, Alan and
                  Garcia{-}Romero, Daniel and
                  Villalba, Jes{\'{u}}s and
                  Maciejewski, Matthew and
                  Manohar, Vimal and
                  Dehak, Najim and
                  Povey, Daniel and
                  Watanabe, Shinji and
                  Khudanpur, Sanjeev},
  editor       = {Yegnanarayana, B.},
  title        = {Diarization is Hard: Some Experiences and Lessons Learned for the
                  {JHU} Team in the Inaugural {DIHARD} Challenge},
  booktitle    = {19th Annual Conference of the International Speech Communication Association,
                  Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages        = {2808--2812},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1893},
  doi          = {10.21437/INTERSPEECH.2018-1893},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SellSMGVMMDPWK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SarmaGPGSD18,
  author       = {Sarma, Mousmita and
                  Ghahremani, Pegah and
                  Povey, Daniel and
                  Goel, Nagendra Kumar and
                  Sarma, Kandarpa Kumar and
                  Dehak, Najim},
  editor       = {Yegnanarayana, B.},
  title        = {Emotion Identification from Raw Speech Signals Using {DNNs}},
  booktitle    = {19th Annual Conference of the International Speech Communication Association,
                  Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages        = {3097--3101},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1353},
  doi          = {10.21437/INTERSPEECH.2018-1353},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SarmaGPGSD18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LiXWPK18,
  author       = {Li, Ke and
                  Xu, Hainan and
                  Wang, Yiming and
                  Povey, Daniel and
                  Khudanpur, Sanjeev},
  editor       = {Yegnanarayana, B.},
  title        = {Recurrent Neural Network Language Model Adaptation for Conversational
                  Speech Recognition},
  booktitle    = {19th Annual Conference of the International Speech Communication Association,
                  Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages        = {3373--3377},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1413},
  doi          = {10.21437/INTERSPEECH.2018-1413},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/LiXWPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ZhuKSMP18,
  author       = {Zhu, Yingke and
                  Ko, Tom and
                  Snyder, David and
                  Mak, Brian and
                  Povey, Daniel},
  editor       = {Yegnanarayana, B.},
  title        = {Self-Attentive Speaker Embeddings for Text-Independent Speaker Verification},
  booktitle    = {19th Annual Conference of the International Speech Communication Association,
                  Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages        = {3573--3577},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1158},
  doi          = {10.21437/INTERSPEECH.2018-1158},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/ZhuKSMP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PoveyCWLXYK18,
  author    = {Povey, Daniel and Cheng, Gaofeng and Wang, Yiming and Li, Ke and Xu, Hainan and Yarmohammadi, Mahsa and Khudanpur, Sanjeev},
  editor    = {Yegnanarayana, B.},
  title     = {Semi-Orthogonal Low-Rank Matrix Factorization for Deep Neural Networks},
  booktitle = {19th Annual Conference of the International Speech Communication Association, Interspeech 2018, Hyderabad, India, September 2-6, 2018},
  pages     = {3743--3747},
  publisher = {{ISCA}},
  year      = {2018},
  url       = {https://doi.org/10.21437/Interspeech.2018-1417},
  doi       = {10.21437/INTERSPEECH.2018-1417},
  timestamp = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/PoveyCWLXYK18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/odyssey/SnyderGMSPK18,
  author    = {Snyder, David and Garcia{-}Romero, Daniel and McCree, Alan and Sell, Gregory and Povey, Daniel and Khudanpur, Sanjeev},
  editor    = {Larcher, Anthony and Bonastre, Jean{-}Fran{\c{c}}ois},
  title     = {Spoken Language Recognition using X-vectors},
  booktitle = {Odyssey 2018: The Speaker and Language Recognition Workshop, 26-29 June 2018, Les Sables d'Olonne, France},
  pages     = {105--111},
  publisher = {{ISCA}},
  year      = {2018},
  url       = {https://doi.org/10.21437/Odyssey.2018-15},
  doi       = {10.21437/ODYSSEY.2018-15},
  timestamp = {Tue, 30 Jul 2024 09:37:28 +0200},
  biburl    = {https://dblp.org/rec/conf/odyssey/SnyderGMSPK18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/slt/HadianPSTK18,
  author    = {Hadian, Hossein and Povey, Daniel and Sameti, Hossein and Trmal, Jan and Khudanpur, Sanjeev},
  title     = {Improving {LF-MMI} Using Unconstrained Supervisions for {ASR}},
  booktitle = {2018 {IEEE} Spoken Language Technology Workshop, {SLT} 2018, Athens, Greece, December 18-21, 2018},
  pages     = {43--47},
  publisher = {{IEEE}},
  year      = {2018},
  url       = {https://doi.org/10.1109/SLT.2018.8639684},
  doi       = {10.1109/SLT.2018.8639684},
  timestamp = {Mon, 15 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/slt/HadianPSTK18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/slt/ManoharGPK18,
  author    = {Manohar, Vimal and Ghahremani, Pegah and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {A Teacher-Student Learning Approach for Unsupervised Domain Adaptation of Sequence-Trained {ASR} Models},
  booktitle = {2018 {IEEE} Spoken Language Technology Workshop, {SLT} 2018, Athens, Greece, December 18-21, 2018},
  pages     = {250--257},
  publisher = {{IEEE}},
  year      = {2018},
  url       = {https://doi.org/10.1109/SLT.2018.8639635},
  doi       = {10.1109/SLT.2018.8639635},
  timestamp = {Fri, 15 Feb 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/slt/ManoharGPK18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: the acronym GPU is brace-protected so sentence-casing styles keep it uppercase.
@article{DBLP:journals/corr/abs-1804-03243,
  author       = {Zhehuai Chen and
                  Justin Luitjens and
                  Hainan Xu and
                  Yiming Wang and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {A {GPU}-based {WFST} Decoder with Exact Lattice Generation},
  journal      = {CoRR},
  volume       = {abs/1804.03243},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.03243},
  eprinttype   = {arXiv},
  eprint       = {1804.03243},
  timestamp    = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-03243.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/GhahremaniMHPK17,
  author    = {Ghahremani, Pegah and Manohar, Vimal and Hadian, Hossein and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Investigation of transfer learning for {ASR} using {LF-MMI} trained neural networks},
  booktitle = {2017 {IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU} 2017, Okinawa, Japan, December 16-20, 2017},
  pages     = {279--286},
  publisher = {{IEEE}},
  year      = {2017},
  url       = {https://doi.org/10.1109/ASRU.2017.8268947},
  doi       = {10.1109/ASRU.2017.8268947},
  timestamp = {Mon, 15 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/asru/GhahremaniMHPK17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: the proper nouns Kaldi and Arabic are brace-protected so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/asru/ManoharPK17,
  author       = {Vimal Manohar and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {{JHU} {Kaldi} system for {Arabic} {MGB-3} {ASR} challenge using diarization,
                  audio-transcript alignment and transfer learning},
  booktitle    = {2017 {IEEE} Automatic Speech Recognition and Understanding Workshop,
                  {ASRU} 2017, Okinawa, Japan, December 16-20, 2017},
  pages        = {346--352},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ASRU.2017.8268956},
  doi          = {10.1109/ASRU.2017.8268956},
  timestamp    = {Tue, 30 Jan 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/asru/ManoharPK17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/Garcia-RomeroSS17,
  author    = {Garcia{-}Romero, Daniel and Snyder, David and Sell, Gregory and Povey, Daniel and McCree, Alan},
  title     = {Speaker diarization using deep neural network embeddings},
  booktitle = {2017 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages     = {4930--4934},
  publisher = {{IEEE}},
  year      = {2017},
  url       = {https://doi.org/10.1109/ICASSP.2017.7953094},
  doi       = {10.1109/ICASSP.2017.7953094},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/Garcia-RomeroSS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/KoPPSK17,
  author    = {Ko, Tom and Peddinti, Vijayaditya and Povey, Daniel and Seltzer, Michael L. and Khudanpur, Sanjeev},
  title     = {A study on data augmentation of reverberant speech for robust speech recognition},
  booktitle = {2017 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages     = {5220--5224},
  publisher = {{IEEE}},
  year      = {2017},
  url       = {https://doi.org/10.1109/ICASSP.2017.7953152},
  doi       = {10.1109/ICASSP.2017.7953152},
  timestamp = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/KoPPSK17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/HadianPSK17,
  author    = {Hadian, Hossein and Povey, Daniel and Sameti, Hossein and Khudanpur, Sanjeev},
  editor    = {Lacerda, Francisco},
  title     = {Phone Duration Modeling for {LVCSR} Using Neural Networks},
  booktitle = {18th Annual Conference of the International Speech Communication Association, Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages     = {518--522},
  publisher = {{ISCA}},
  year      = {2017},
  url       = {https://doi.org/10.21437/Interspeech.2017-1680},
  doi       = {10.21437/INTERSPEECH.2017-1680},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HadianPSK17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/SnyderGPK17,
  author    = {Snyder, David and Garcia{-}Romero, Daniel and Povey, Daniel and Khudanpur, Sanjeev},
  editor    = {Lacerda, Francisco},
  title     = {Deep Neural Network Embeddings for Text-Independent Speaker Verification},
  booktitle = {18th Annual Conference of the International Speech Communication Association, Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages     = {999--1003},
  publisher = {{ISCA}},
  year      = {2017},
  url       = {https://doi.org/10.21437/Interspeech.2017-620},
  doi       = {10.21437/INTERSPEECH.2017-620},
  timestamp = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/SnyderGPK17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: the acronym LSTMs is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/interspeech/ChengPPMKY17,
  author       = {Gaofeng Cheng and
                  Vijayaditya Peddinti and
                  Daniel Povey and
                  Vimal Manohar and
                  Sanjeev Khudanpur and
                  Yonghong Yan},
  editor       = {Francisco Lacerda},
  title        = {An Exploration of Dropout with {LSTMs}},
  booktitle    = {18th Annual Conference of the International Speech Communication Association,
                  Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages        = {1586--1590},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-129},
  doi          = {10.21437/INTERSPEECH.2017-129},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ChengPPMKY17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/WangPXZPK17,
  author    = {Wang, Yiming and Peddinti, Vijayaditya and Xu, Hainan and Zhang, Xiaohui and Povey, Daniel and Khudanpur, Sanjeev},
  editor    = {Lacerda, Francisco},
  title     = {Backstitch: Counteracting Finite-Sample Bias via Negative Steps},
  booktitle = {18th Annual Conference of the International Speech Communication Association, Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages     = {1631--1635},
  publisher = {{ISCA}},
  year      = {2017},
  url       = {https://doi.org/10.21437/Interspeech.2017-1323},
  doi       = {10.21437/INTERSPEECH.2017-1323},
  timestamp = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/WangPXZPK17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/ZhangMPK17,
  author    = {Zhang, Xiaohui and Manohar, Vimal and Povey, Daniel and Khudanpur, Sanjeev},
  editor    = {Lacerda, Francisco},
  title     = {Acoustic Data-Driven Lexicon Learning Based on a Greedy Pronunciation Selection Framework},
  booktitle = {18th Annual Conference of the International Speech Communication Association, Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages     = {2541--2545},
  publisher = {{ISCA}},
  year      = {2017},
  url       = {https://doi.org/10.21437/Interspeech.2017-588},
  doi       = {10.21437/INTERSPEECH.2017-588},
  timestamp = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ZhangMPK17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: Kaldi and OpenKWS are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/interspeech/TrmalWPZGWMXPK17,
  author       = {Jan Trmal and
                  Matthew Wiesner and
                  Vijayaditya Peddinti and
                  Xiaohui Zhang and
                  Pegah Ghahremani and
                  Yiming Wang and
                  Vimal Manohar and
                  Hainan Xu and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  editor       = {Francisco Lacerda},
  title        = {The {Kaldi} {OpenKWS} System: Improving Low Resource Keyword Search},
  booktitle    = {18th Annual Conference of the International Speech Communication Association,
                  Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages        = {3597--3601},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-601},
  doi          = {10.21437/INTERSPEECH.2017-601},
  timestamp    = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/TrmalWPZGWMXPK17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZhangMPK17,
  author     = {Zhang, Xiaohui and Manohar, Vimal and Povey, Daniel and Khudanpur, Sanjeev},
  title      = {Acoustic data-driven lexicon learning based on a greedy pronunciation selection framework},
  journal    = {CoRR},
  volume     = {abs/1706.03747},
  year       = {2017},
  url        = {http://arxiv.org/abs/1706.03747},
  eprinttype = {arXiv},
  eprint     = {1706.03747},
  timestamp  = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ZhangMPK17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/ChenPK16,
  author    = {Chen, Guoguo and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Acoustic data-driven pronunciation lexicon generation for logographic languages},
  booktitle = {2016 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages     = {5350--5354},
  publisher = {{IEEE}},
  year      = {2016},
  url       = {https://doi.org/10.1109/ICASSP.2016.7472699},
  doi       = {10.1109/ICASSP.2016.7472699},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/ChenPK16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/PeddintiMWPK16,
  author    = {Peddinti, Vijayaditya and Manohar, Vimal and Wang, Yiming and Povey, Daniel and Khudanpur, Sanjeev},
  editor    = {Morgan, Nelson},
  title     = {Far-Field {ASR} Without Parallel Data},
  booktitle = {17th Annual Conference of the International Speech Communication Association, Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages     = {1996--2000},
  publisher = {{ISCA}},
  year      = {2016},
  url       = {https://doi.org/10.21437/Interspeech.2016-1475},
  doi       = {10.21437/INTERSPEECH.2016-1475},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/PeddintiMWPK16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/PoveyPGGMNWK16,
  author    = {Povey, Daniel and Peddinti, Vijayaditya and Galvez, Daniel and Ghahremani, Pegah and Manohar, Vimal and Na, Xingyu and Wang, Yiming and Khudanpur, Sanjeev},
  editor    = {Morgan, Nelson},
  title     = {Purely Sequence-Trained Neural Networks for {ASR} Based on Lattice-Free {MMI}},
  booktitle = {17th Annual Conference of the International Speech Communication Association, Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages     = {2751--2755},
  publisher = {{ISCA}},
  year      = {2016},
  url       = {https://doi.org/10.21437/Interspeech.2016-595},
  doi       = {10.21437/INTERSPEECH.2016-595},
  timestamp = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/PoveyPGGMNWK16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: the acronym CNNs is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/interspeech/GhahremaniMPK16,
  author       = {Pegah Ghahremani and
                  Vimal Manohar and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  editor       = {Nelson Morgan},
  title        = {Acoustic Modelling from the Signal Domain Using {CNNs}},
  booktitle    = {17th Annual Conference of the International Speech Communication Association,
                  Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages        = {3434--3438},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {https://doi.org/10.21437/Interspeech.2016-1495},
  doi          = {10.21437/INTERSPEECH.2016-1495},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/GhahremaniMPK16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/slt/SnyderGPGCK16,
  author    = {Snyder, David and Ghahremani, Pegah and Povey, Daniel and Garcia{-}Romero, Daniel and Carmiel, Yishay and Khudanpur, Sanjeev},
  title     = {Deep neural network-based speaker embeddings for end-to-end speaker verification},
  booktitle = {2016 {IEEE} Spoken Language Technology Workshop, {SLT} 2016, San Diego, CA, USA, December 13-16, 2016},
  pages     = {165--170},
  publisher = {{IEEE}},
  year      = {2016},
  url       = {https://doi.org/10.1109/SLT.2016.7846260},
  doi       = {10.1109/SLT.2016.7846260},
  timestamp = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl    = {https://dblp.org/rec/conf/slt/SnyderGPGCK16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/asru/SnyderGP15,
  author    = {Snyder, David and Garcia{-}Romero, Daniel and Povey, Daniel},
  title     = {Time delay deep neural network-based universal background models for speaker recognition},
  booktitle = {2015 {IEEE} Workshop on Automatic Speech Recognition and Understanding, {ASRU} 2015, Scottsdale, AZ, USA, December 13-17, 2015},
  pages     = {92--97},
  publisher = {{IEEE}},
  year      = {2015},
  url       = {https://doi.org/10.1109/ASRU.2015.7404779},
  doi       = {10.1109/ASRU.2015.7404779},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/asru/SnyderGP15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: ASpIRE, TDNNS and iVector are brace-protected so sentence-casing styles keep their casing as recorded.
@inproceedings{DBLP:conf/asru/PeddintiCMKPK15,
  author       = {Vijayaditya Peddinti and
                  Guoguo Chen and
                  Vimal Manohar and
                  Tom Ko and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {{JHU} {ASpIRE} system: Robust {LVCSR} with {TDNNS}, {iVector} adaptation
                  and {RNN-LMS}},
  booktitle    = {2015 {IEEE} Workshop on Automatic Speech Recognition and Understanding,
                  {ASRU} 2015, Scottsdale, AZ, USA, December 13-17, 2015},
  pages        = {539--546},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/ASRU.2015.7404842},
  doi          = {10.1109/ASRU.2015.7404842},
  timestamp    = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/asru/PeddintiCMKPK15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/KumarBTPK15,
  author    = {Kumar, Gaurav and Blackwood, Graeme W. and Trmal, Jan and Povey, Daniel and Khudanpur, Sanjeev},
  editor    = {M{\`{a}}rquez, Llu{\'{\i}}s and Callison{-}Burch, Chris and Su, Jian and Pighin, Daniele and Marton, Yuval},
  title     = {A Coarse-Grained Model for Optimal Coupling of {ASR} and {SMT} Systems for Speech Translation},
  booktitle = {Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2015, Lisbon, Portugal, September 17-21, 2015},
  pages     = {1902--1907},
  publisher = {The Association for Computational Linguistics},
  year      = {2015},
  url       = {https://doi.org/10.18653/v1/d15-1218},
  doi       = {10.18653/V1/D15-1218},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/KumarBTPK15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/PanayotovCPK15,
  author    = {Panayotov, Vassil and Chen, Guoguo and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Librispeech: An {ASR} corpus based on public domain audio books},
  booktitle = {2015 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2015, South Brisbane, Queensland, Australia, April 19-24, 2015},
  pages     = {5206--5210},
  publisher = {{IEEE}},
  year      = {2015},
  url       = {https://doi.org/10.1109/ICASSP.2015.7178964},
  doi       = {10.1109/ICASSP.2015.7178964},
  timestamp = {Fri, 25 Dec 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/PanayotovCPK15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/ChenXWPK15,
  author    = {Chen, Guoguo and Xu, Hainan and Wu, Minhua and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Pronunciation and silence probability modeling for {ASR}},
  booktitle = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages     = {533--537},
  publisher = {{ISCA}},
  year      = {2015},
  url       = {https://doi.org/10.21437/Interspeech.2015-198},
  doi       = {10.21437/INTERSPEECH.2015-198},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ChenXWPK15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/XuCPK15,
  author    = {Xu, Hainan and Chen, Guoguo and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Modeling phonetic context with non-random forests for speech recognition},
  booktitle = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages     = {2117--2121},
  publisher = {{ISCA}},
  year      = {2015},
  url       = {https://doi.org/10.21437/Interspeech.2015-478},
  doi       = {10.21437/INTERSPEECH.2015-478},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/XuCPK15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/PeddintiCPK15,
  author    = {Peddinti, Vijayaditya and Chen, Guoguo and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Reverberation robust acoustic modeling using i-vectors with time delay neural networks},
  booktitle = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages     = {2440--2444},
  publisher = {{ISCA}},
  year      = {2015},
  url       = {https://doi.org/10.21437/Interspeech.2015-527},
  doi       = {10.21437/INTERSPEECH.2015-527},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/PeddintiCPK15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/ManoharPK15,
  author    = {Manohar, Vimal and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Semi-supervised maximum mutual information training of deep neural network acoustic models},
  booktitle = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages     = {2630--2634},
  publisher = {{ISCA}},
  year      = {2015},
  url       = {https://doi.org/10.21437/Interspeech.2015-561},
  doi       = {10.21437/INTERSPEECH.2015-561},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ManoharPK15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/PeddintiPK15,
  author    = {Peddinti, Vijayaditya and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {A time delay neural network architecture for efficient modeling of long temporal contexts},
  booktitle = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages     = {3214--3218},
  publisher = {{ISCA}},
  year      = {2015},
  url       = {https://doi.org/10.21437/Interspeech.2015-647},
  doi       = {10.21437/INTERSPEECH.2015-647},
  timestamp = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/PeddintiPK15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/KoPPK15,
  author    = {Ko, Tom and Peddinti, Vijayaditya and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Audio augmentation for speech recognition},
  booktitle = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages     = {3586--3589},
  publisher = {{ISCA}},
  year      = {2015},
  url       = {https://doi.org/10.21437/Interspeech.2015-711},
  doi       = {10.21437/INTERSPEECH.2015-711},
  timestamp = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/KoPPK15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/ZhangPK15,
  author    = {Zhang, Xiaohui and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {A diversity-penalizing ensemble training method for deep learning},
  booktitle = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages     = {3590--3594},
  publisher = {{ISCA}},
  year      = {2015},
  url       = {https://doi.org/10.21437/Interspeech.2015-712},
  doi       = {10.21437/INTERSPEECH.2015-712},
  timestamp = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ZhangPK15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% eprinttype and eprint carry the arXiv identifier taken from the url field of this entry.
@inproceedings{DBLP:journals/corr/PoveyZK14,
  author       = {Daniel Povey and
                  Xiaohui Zhang and
                  Sanjeev Khudanpur},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {Parallel training of Deep Neural Networks with Natural Gradient and
                  Parameter Averaging},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Workshop Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1410.7455},
  eprinttype   = {arXiv},
  eprint       = {1410.7455},
  timestamp    = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/PoveyZK14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SnyderCP15,
  author     = {Snyder, David and Chen, Guoguo and Povey, Daniel},
  title      = {{MUSAN:} {A} Music, Speech, and Noise Corpus},
  journal    = {CoRR},
  volume     = {abs/1510.08484},
  year       = {2015},
  url        = {http://arxiv.org/abs/1510.08484},
  eprinttype = {arXiv},
  eprint     = {1510.08484},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SnyderCP15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/ZhangTPK14,
  author    = {Zhang, Xiaohui and Trmal, Jan and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Improving deep neural network acoustic models using generalized maxout networks},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages     = {215--219},
  publisher = {{IEEE}},
  year      = {2014},
  url       = {https://doi.org/10.1109/ICASSP.2014.6853589},
  doi       = {10.1109/ICASSP.2014.6853589},
  timestamp = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/ZhangTPK14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/GhahremaniBPRTK14,
  author    = {Ghahremani, Pegah and BabaAli, Bagher and Povey, Daniel and Riedhammer, Korbinian and Trmal, Jan and Khudanpur, Sanjeev},
  title     = {A pitch extraction algorithm tuned for automatic speech recognition},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages     = {2494--2498},
  publisher = {{IEEE}},
  year      = {2014},
  url       = {https://doi.org/10.1109/ICASSP.2014.6854049},
  doi       = {10.1109/ICASSP.2014.6854049},
  timestamp = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/GhahremaniBPRTK14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/KumarPPK14,
  author       = {Gaurav Kumar and
                  Matt Post and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {Some insights from translating conversational telephone speech},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages        = {3231--3235},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICASSP.2014.6854197},
  doi          = {10.1109/ICASSP.2014.6854197},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/KumarPPK14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/VuIPMSB14,
  author       = {Ngoc Thang Vu and
                  David Imseng and
                  Daniel Povey and
                  Petr Motl{\'{\i}}cek and
                  Tanja Schultz and
                  Herv{\'{e}} Bourlard},
  title        = {Multilingual deep neural network based acoustic modeling for rapid
                  language adaptation},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages        = {7639--7643},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICASSP.2014.6855086},
  doi          = {10.1109/ICASSP.2014.6855086},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/VuIPMSB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/NoldenSPGMN14,
  author       = {David Nolden and
                  Hagen Soltau and
                  Daniel Povey and
                  Pegah Ghahremani and
                  Lidia Mangu and
                  Hermann Ney},
  editor       = {Haizhou Li and
                  Helen M. Meng and
                  Bin Ma and
                  Engsiong Chng and
                  Lei Xie},
  title        = {Removing redundancy from lattices},
  booktitle    = {15th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2014, Singapore, September 14-18, 2014},
  pages        = {656--660},
  publisher    = {{ISCA}},
  year         = {2014},
  url          = {https://doi.org/10.21437/Interspeech.2014-166},
  doi          = {10.21437/INTERSPEECH.2014-166},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/NoldenSPGMN14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ChiuWTPCR14,
  author       = {Justin T. Chiu and
                  Yun Wang and
                  Jan Trmal and
                  Daniel Povey and
                  Guoguo Chen and
                  Alexander I. Rudnicky},
  editor       = {Haizhou Li and
                  Helen M. Meng and
                  Bin Ma and
                  Engsiong Chng and
                  Lei Xie},
  title        = {Combination of {FST} and {CN} search in spoken term detection},
  booktitle    = {15th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2014, Singapore, September 14-18, 2014},
  pages        = {2784--2788},
  publisher    = {{ISCA}},
  year         = {2014},
  url          = {https://doi.org/10.21437/Interspeech.2014-532},
  doi          = {10.21437/INTERSPEECH.2014-532},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ChiuWTPCR14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwslt/Kumar0CCPK14,
  author       = {Gaurav Kumar and
                  Yuan Cao and
                  Ryan Cotterell and
                  Chris Callison{-}Burch and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {Translations of the {Callhome} {Egyptian} {Arabic} corpus for conversational
                  speech translation},
  booktitle    = {Proceedings of the 11th International Workshop on Spoken Language
                  Translation: Papers, {IWSLT} 2014, Lake Tahoe, CA, USA, December 4-5,
                  2014},
  year         = {2014},
  url          = {https://aclanthology.org/2014.iwslt-papers.13},
  timestamp    = {Thu, 01 Aug 2024 15:37:24 +0200},
  biburl       = {https://dblp.org/rec/conf/iwslt/Kumar0CCPK14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/slt/Garcia-RomeroZM14,
  author       = {Daniel Garcia{-}Romero and
                  Xiaohui Zhang and
                  Alan McCree and
                  Daniel Povey},
  title        = {Improving speaker recognition performance in the domain adaptation
                  challenge using deep neural networks},
  booktitle    = {2014 {IEEE} Spoken Language Technology Workshop, {SLT} 2014, South
                  Lake Tahoe, NV, USA, December 7-10, 2014},
  pages        = {378--383},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/SLT.2014.7078604},
  doi          = {10.1109/SLT.2014.7078604},
  timestamp    = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/slt/Garcia-RomeroZM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/slt/TrmalCPKGZMLJKY14,
  author       = {Jan Trmal and
                  Guoguo Chen and
                  Daniel Povey and
                  Sanjeev Khudanpur and
                  Pegah Ghahremani and
                  Xiaohui Zhang and
                  Vimal Manohar and
                  Chunxi Liu and
                  Aren Jansen and
                  Dietrich Klakow and
                  David Yarowsky and
                  Florian Metze},
  title        = {A keyword search system using open source software},
  booktitle    = {2014 {IEEE} Spoken Language Technology Workshop, {SLT} 2014, South
                  Lake Tahoe, NV, USA, December 7-10, 2014},
  pages        = {530--535},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/SLT.2014.7078630},
  doi          = {10.1109/SLT.2014.7078630},
  timestamp    = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/slt/TrmalCPKGZMLJKY14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/ChenYTPK13,
  author       = {Guoguo Chen and
                  Oguz Yilmaz and
                  Jan Trmal and
                  Daniel Povey and
                  Sanjeev Khudanpur},
  title        = {Using proxies for {OOV} keywords in the keyword search task},
  booktitle    = {2013 {IEEE} Workshop on Automatic Speech Recognition and Understanding,
                  Olomouc, Czech Republic, December 8-12, 2013},
  pages        = {416--421},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ASRU.2013.6707766},
  doi          = {10.1109/ASRU.2013.6707766},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/asru/ChenYTPK13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/HannemannPZ13,
  author       = {Mirko Hannemann and
                  Daniel Povey and
                  Geoffrey Zweig},
  title        = {Combining forward and backward search in decoding},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {6739--6743},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6638966},
  doi          = {10.1109/ICASSP.2013.6638966},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HannemannPZ13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MotlicekPK13,
  author       = {Petr Motl{\'{\i}}cek and
                  Daniel Povey and
                  Martin Karafi{\'{a}}t},
  title        = {Feature and score level combination of subspace {Gaussians} in {LVCSR}
                  task},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {7604--7608},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6639142},
  doi          = {10.1109/ICASSP.2013.6639142},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MotlicekPK13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ChenKPTYY13,
  author       = {Guoguo Chen and
                  Sanjeev Khudanpur and
                  Daniel Povey and
                  Jan Trmal and
                  David Yarowsky and
                  Oguz Yilmaz},
  title        = {Quantifying the value of pronunciation lexicons for keyword search
                  in low-resource languages},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {8560--8564},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6639336},
  doi          = {10.1109/ICASSP.2013.6639336},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ChenKPTYY13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/RathPVC13,
  author       = {Shakti P. Rath and
                  Daniel Povey and
                  Karel Vesel{\'{y}} and
                  Jan Cernock{\'{y}}},
  editor       = {Fr{\'{e}}d{\'{e}}ric Bimbot and
                  Christophe Cerisara and
                  C{\'{e}}cile Fougeron and
                  Guillaume Gravier and
                  Lori Lamel and
                  Fran{\c{c}}ois Pellegrino and
                  Pascal Perrier},
  title        = {Improved feature processing for deep neural networks},
  booktitle    = {14th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2013, Lyon, France, August 25-29, 2013},
  pages        = {109--113},
  publisher    = {{ISCA}},
  year         = {2013},
  url          = {https://doi.org/10.21437/Interspeech.2013-48},
  doi          = {10.21437/INTERSPEECH.2013-48},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/RathPVC13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/VeselyGBP13,
  author       = {Karel Vesel{\'{y}} and
                  Arnab Ghoshal and
                  Luk{\'{a}}s Burget and
                  Daniel Povey},
  editor       = {Fr{\'{e}}d{\'{e}}ric Bimbot and
                  Christophe Cerisara and
                  C{\'{e}}cile Fougeron and
                  Guillaume Gravier and
                  Lori Lamel and
                  Fran{\c{c}}ois Pellegrino and
                  Pascal Perrier},
  title        = {Sequence-discriminative training of deep neural networks},
  booktitle    = {14th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2013, Lyon, France, August 25-29, 2013},
  pages        = {2345--2349},
  publisher    = {{ISCA}},
  year         = {2013},
  url          = {https://doi.org/10.21437/Interspeech.2013-548},
  doi          = {10.21437/INTERSPEECH.2013-548},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/VeselyGBP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/PoveyY12,
  author       = {Daniel Povey and
                  Kaisheng Yao},
  title        = {A basis representation of constrained {MLLR} transforms for robust
                  adaptation},
  journal      = {Comput. Speech Lang.},
  volume       = {26},
  number       = {1},
  pages        = {35--51},
  year         = {2012},
  url          = {https://doi.org/10.1016/j.csl.2011.04.002},
  doi          = {10.1016/J.CSL.2011.04.002},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csl/PoveyY12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/VinyalsRP12,
  author       = {Oriol Vinyals and
                  Suman V. Ravuri and
                  Daniel Povey},
  title        = {Revisiting Recurrent Neural Networks for robust {ASR}},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {4085--4088},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6288816},
  doi          = {10.1109/ICASSP.2012.6288816},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/VinyalsRP12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyHBBGJKKMQRVV12,
  author       = {Daniel Povey and
                  Mirko Hannemann and
                  Gilles Boulianne and
                  Luk{\'{a}}s Burget and
                  Arnab Ghoshal and
                  Milos Janda and
                  Martin Karafi{\'{a}}t and
                  Stefan Kombrink and
                  Petr Motl{\'{\i}}cek and
                  Yanmin Qian and
                  Korbinian Riedhammer and
                  Karel Vesel{\'{y}} and
                  Ngoc Thang Vu},
  title        = {Generating exact lattices in the {WFST} framework},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {4213--4216},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6288848},
  doi          = {10.1109/ICASSP.2012.6288848},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyHBBGJKKMQRVV12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/VuSP12,
  author       = {Ngoc Thang Vu and
                  Tanja Schultz and
                  Daniel Povey},
  title        = {Modeling gender dependency in the Subspace {GMM} framework},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {4345--4348},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6288881},
  doi          = {10.1109/ICASSP.2012.6288881},
  timestamp    = {Sat, 31 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/VuSP12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/RiedhammerBGP12,
  author       = {Korbinian Riedhammer and
                  Tobias Bocklet and
                  Arnab Ghoshal and
                  Daniel Povey},
  title        = {Revisiting semi-continuous hidden {Markov} models},
  booktitle    = {2012 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2012, Kyoto, Japan, March 25-30, 2012},
  pages        = {4721--4724},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICASSP.2012.6288973},
  doi          = {10.1109/ICASSP.2012.6288973},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/RiedhammerBGP12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/WengJP12,
  author       = {Chao Weng and
                  Biing{-}Hwang Juang and
                  Daniel Povey},
  title        = {Discriminative Training Using Non-uniform Criteria for Keyword Spotting
                  on Spontaneous Speech},
  booktitle    = {13th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2012, Portland, Oregon, USA, September 9-13, 2012},
  pages        = {559--562},
  publisher    = {{ISCA}},
  year         = {2012},
  url          = {https://doi.org/10.21437/Interspeech.2012-172},
  doi          = {10.21437/INTERSPEECH.2012-172},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/WengJP12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/jmlr/VinyalsP12,
  author       = {Oriol Vinyals and
                  Daniel Povey},
  editor       = {Neil D. Lawrence and
                  Mark A. Girolami},
  title        = {Krylov Subspace Descent for Deep Learning},
  booktitle    = {Proceedings of the Fifteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2012, La Palma, Canary Islands,
                  Spain, April 21-23, 2012},
  series       = {{JMLR} Proceedings},
  volume       = {22},
  pages        = {1261--1268},
  publisher    = {JMLR.org},
  year         = {2012},
  url          = {http://proceedings.mlr.press/v22/vinyals12.html},
  timestamp    = {Wed, 29 May 2019 08:41:44 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/VinyalsP12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/PoveyBAAKGGGKRRST11,
  author       = {Daniel Povey and
                  Luk{\'{a}}s Burget and
                  Mohit Agarwal and
                  Pinar Akyazi and
                  Kai Feng and
                  Arnab Ghoshal and
                  Ondrej Glembek and
                  Nagendra K. Goel and
                  Martin Karafi{\'{a}}t and
                  Ariya Rastrow and
                  Richard C. Rose and
                  Petr Schwarz and
                  Samuel Thomas},
  title        = {The subspace {Gaussian} mixture model - {A} structured model for speech
                  recognition},
  journal      = {Comput. Speech Lang.},
  volume       = {25},
  number       = {2},
  pages        = {404--439},
  year         = {2011},
  url          = {https://doi.org/10.1016/j.csl.2010.06.003},
  doi          = {10.1016/J.CSL.2010.06.003},
  timestamp    = {Thu, 24 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/csl/PoveyBAAKGGGKRRST11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/XuPMZ11,
  author       = {Haihua Xu and
                  Daniel Povey and
                  Lidia Mangu and
                  Jie Zhu},
  title        = {Minimum {Bayes} Risk decoding and system combination based on a recursion
                  for edit distance},
  journal      = {Comput. Speech Lang.},
  volume       = {25},
  number       = {4},
  pages        = {802--828},
  year         = {2011},
  url          = {https://doi.org/10.1016/j.csl.2011.03.001},
  doi          = {10.1016/J.CSL.2011.03.001},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csl/XuPMZ11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/PoveyZA11,
  author       = {Daniel Povey and
                  Geoffrey Zweig and
                  Alex Acero},
  editor       = {David Nahamoo and
                  Michael Picheny},
  title        = {Speaker adaptation with an Exponential Transform},
  booktitle    = {2011 {IEEE} Workshop on Automatic Speech Recognition {\&} Understanding,
                  {ASRU} 2011, Waikoloa, HI, USA, December 11-15, 2011},
  pages        = {158--163},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ASRU.2011.6163923},
  doi          = {10.1109/ASRU.2011.6163923},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/asru/PoveyZA11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/MikolovDPBC11,
  author       = {Tom{\'{a}}s Mikolov and
                  Anoop Deoras and
                  Daniel Povey and
                  Luk{\'{a}}s Burget and
                  Jan Cernock{\'{y}}},
  editor       = {David Nahamoo and
                  Michael Picheny},
  title        = {Strategies for training large scale neural network language models},
  booktitle    = {2011 {IEEE} Workshop on Automatic Speech Recognition {\&} Understanding,
                  {ASRU} 2011, Waikoloa, HI, USA, December 11-15, 2011},
  pages        = {196--201},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ASRU.2011.6163930},
  doi          = {10.1109/ASRU.2011.6163930},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/asru/MikolovDPBC11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/QianXPL11,
  author       = {Yanmin Qian and
                  Ji Xu and
                  Daniel Povey and
                  Jia Liu},
  editor       = {David Nahamoo and
                  Michael Picheny},
  title        = {Strategies for using {MLP} based features with limited target-language
                  training data},
  booktitle    = {2011 {IEEE} Workshop on Automatic Speech Recognition {\&} Understanding,
                  {ASRU} 2011, Waikoloa, HI, USA, December 11-15, 2011},
  pages        = {354--358},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ASRU.2011.6163957},
  doi          = {10.1109/ASRU.2011.6163957},
  timestamp    = {Mon, 20 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/asru/QianXPL11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyY11,
  author       = {Daniel Povey and
                  Kaisheng Yao},
  title        = {A basis method for robust estimation of constrained {MLLR}},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {4460--4463},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ICASSP.2011.5947344},
  doi          = {10.1109/ICASSP.2011.5947344},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyY11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyKGS11,
  author       = {Daniel Povey and
                  Martin Karafi{\'{a}}t and
                  Arnab Ghoshal and
                  Petr Schwarz},
  title        = {A symmetrization of the Subspace {Gaussian} Mixture Model},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress
                  Center, Prague, Czech Republic},
  pages        = {4504--4507},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ICASSP.2011.5947355},
  doi          = {10.1109/ICASSP.2011.5947355},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyKGS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/QianPL11,
  author       = {Yanmin Qian and
                  Daniel Povey and
                  Jia Liu},
  title        = {State-Level Data Borrowing for Low-Resource Speech Recognition Based
                  on Subspace {GMMs}},
  booktitle    = {12th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2011, Florence, Italy, August 27-31, 2011},
  pages        = {553--560},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-229},
  doi          = {10.21437/INTERSPEECH.2011-229},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/QianPL11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ChuP10,
  author       = {Stephen M. Chu and
                  Daniel Povey},
  title        = {Speaking rate adaptation using continuous frame rate normalization},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4306--4309},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495656},
  doi          = {10.1109/ICASSP.2010.5495656},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ChuP10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/GhoshalPAABFGGKRRST10,
  author       = {Arnab Ghoshal and
                  Daniel Povey and
                  Mohit Agarwal and
                  Pinar Akyazi and
                  Luk{\'{a}}s Burget and
                  Kai Feng and
                  Ondrej Glembek and
                  Nagendra K. Goel and
                  Martin Karafi{\'{a}}t and
                  Ariya Rastrow and
                  Richard C. Rose and
                  Petr Schwarz and
                  Samuel Thomas},
  title        = {A novel estimation of feature-space {MLLR} for full-covariance models},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4310--4313},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495657},
  doi          = {10.1109/ICASSP.2010.5495657},
  timestamp    = {Thu, 24 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/GhoshalPAABFGGKRRST10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyBAAFGGGKRRST10,
  author       = {Daniel Povey and
                  Luk{\'{a}}s Burget and
                  Mohit Agarwal and
                  Pinar Akyazi and
                  Kai Feng and
                  Arnab Ghoshal and
                  Ondrej Glembek and
                  Nagendra K. Goel and
                  Martin Karafi{\'{a}}t and
                  Ariya Rastrow and
                  Richard C. Rose and
                  Petr Schwarz and
                  Samuel Thomas},
  title        = {Subspace {Gaussian} Mixture Models for speech recognition},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4330--4333},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495662},
  doi          = {10.1109/ICASSP.2010.5495662},
  timestamp    = {Thu, 24 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyBAAFGGGKRRST10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BurgetSAAFGGGKPRRT10,
  author       = {Luk{\'{a}}s Burget and
                  Petr Schwarz and
                  Mohit Agarwal and
                  Pinar Akyazi and
                  Kai Feng and
                  Arnab Ghoshal and
                  Ondrej Glembek and
                  Nagendra K. Goel and
                  Martin Karafi{\'{a}}t and
                  Daniel Povey and
                  Ariya Rastrow and
                  Richard C. Rose and
                  Samuel Thomas},
  title        = {Multilingual acoustic modeling for speech recognition based on subspace
                  {Gaussian} Mixture Models},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4334--4337},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495646},
  doi          = {10.1109/ICASSP.2010.5495646},
  timestamp    = {Thu, 24 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BurgetSAAFGGGKPRRT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ChuPKMZSQ10,
  author       = {Stephen M. Chu and
                  Daniel Povey and
                  Hong{-}Kwang Kuo and
                  Lidia Mangu and
                  Shilei Zhang and
                  Qin Shi and
                  Yong Qin},
  title        = {The 2009 {IBM} {GALE} {Mandarin} broadcast transcription system},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4374--4377},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495639},
  doi          = {10.1109/ICASSP.2010.5495639},
  timestamp    = {Thu, 23 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/ChuPKMZSQ10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonSCCKKMP10,
  author       = {George Saon and
                  Hagen Soltau and
                  Upendra V. Chaudhari and
                  Stephen M. Chu and
                  Brian Kingsbury and
                  Hong{-}Kwang Kuo and
                  Lidia Mangu and
                  Daniel Povey},
  title        = {The {IBM} 2008 {GALE} {Arabic} speech transcription system},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4378--4381},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495640},
  doi          = {10.1109/ICASSP.2010.5495640},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SaonSCCKKMP10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/XuPMZ10,
  author       = {Haihua Xu and
                  Daniel Povey and
                  Lidia Mangu and
                  Jie Zhu},
  title        = {An improved consensus-like method for Minimum {Bayes} Risk decoding
                  and lattice combination},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {4938--4941},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495100},
  doi          = {10.1109/ICASSP.2010.5495100},
  timestamp    = {Thu, 19 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/XuPMZ10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/GoelTAABFGGKPRRS10,
  author       = {Goel, Nagendra and
                  Thomas, Samuel and
                  Agarwal, Mohit and
                  Akyazi, Pinar and
                  Burget, Luk{\'{a}}s and
                  Feng, Kai and
                  Ghoshal, Arnab and
                  Glembek, Ondrej and
                  Karafi{\'{a}}t, Martin and
                  Povey, Daniel and
                  Rastrow, Ariya and
                  Rose, Richard C. and
                  Schwarz, Petr},
  title        = {Approaches to automatic lexicon learning with limited training examples},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas
                  Hotel, Dallas, Texas, {USA}},
  pages        = {5094--5097},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICASSP.2010.5495037},
  doi          = {10.1109/ICASSP.2010.5495037},
  timestamp    = {Thu, 24 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/GoelTAABFGGKPRRS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/SoltauSKKMPE09,
  author       = {Hagen Soltau and
                  George Saon and
                  Brian Kingsbury and
                  Hong{-}Kwang Jeff Kuo and
                  Lidia Mangu and
                  Daniel Povey and
                  Ahmad Emami},
  title        = {Advances in {Arabic} Speech Transcription at {IBM} Under the {DARPA}
                  {GALE} Program},
  journal      = {{IEEE} Transactions on Audio, Speech, and Language Processing},
  volume       = {17},
  number       = {5},
  pages        = {884--894},
  year         = {2009},
  url          = {https://doi.org/10.1109/TASL.2009.2022966},
  doi          = {10.1109/TASL.2009.2022966},
  timestamp    = {Sun, 17 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/SoltauSKKMPE09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonPS09,
  author       = {Saon, George and
                  Povey, Daniel and
                  Soltau, Hagen},
  title        = {Large margin semi-tied covariance transforms for discriminative training},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {3753--3756},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960443},
  doi          = {10.1109/ICASSP.2009.4960443},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/SaonPS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/XuPZW09,
  author       = {Xu, Haihua and
                  Povey, Daniel and
                  Zhu, Jie and
                  Wu, Guanyong},
  title        = {Minimum hypothesis phone error as a decoding method for speech recognition},
  booktitle    = {10th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2009, Brighton, United Kingdom, September 6-10, 2009},
  pages        = {76--79},
  publisher    = {{ISCA}},
  year         = {2009},
  url          = {https://doi.org/10.21437/Interspeech.2009-17},
  doi          = {10.21437/INTERSPEECH.2009-17},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/XuPZW09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyKKRSV08,
  author       = {Povey, Daniel and
                  Kanevsky, Dimitri and
                  Kingsbury, Brian and
                  Ramabhadran, Bhuvana and
                  Saon, George and
                  Visweswariah, Karthik},
  title        = {Boosted {MMI} for model and feature-space discriminative training},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars
                  Palace, Las Vegas, Nevada, {USA}},
  pages        = {4057--4060},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4518545},
  doi          = {10.1109/ICASSP.2008.4518545},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyKKRSV08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/VaradarajanPC08,
  author       = {Balakrishnan Varadarajan and
                  Daniel Povey and
                  Selina M. Chu},
  title        = {Quick {fMLLR} for speaker adaptation in speech recognition},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars
                  Palace, Las Vegas, Nevada, {USA}},
  pages        = {4297--4300},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4518605},
  doi          = {10.1109/ICASSP.2008.4518605},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/VaradarajanPC08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyCV08,
  author       = {Povey, Daniel and
                  Chu, Selina M. and
                  Varadarajan, Balakrishnan},
  title        = {Universal background model based speech recognition},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars
                  Palace, Las Vegas, Nevada, {USA}},
  pages        = {4561--4564},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4518671},
  doi          = {10.1109/ICASSP.2008.4518671},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyCV08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonP08,
  author       = {Saon, George and
                  Povey, Daniel},
  title        = {Penalty function maximization for large margin {HMM} training},
  booktitle    = {9th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages        = {920--923},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-108},
  doi          = {10.21437/INTERSPEECH.2008-108},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaonP08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PoveyKS08,
  author       = {Povey, Daniel and
                  Kuo, Hong{-}Kwang Jeff and
                  Soltau, Hagen},
  title        = {Fast speaker adaptive training for speech recognition},
  booktitle    = {9th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages        = {1245--1248},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-377},
  doi          = {10.21437/INTERSPEECH.2008-377},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/PoveyKS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PoveyK08,
  author       = {Daniel Povey and
                  Brian Kingsbury},
  title        = {{Monte Carlo} model-space noise adaptation for speech recognition},
  booktitle    = {9th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages        = {1281--1284},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-308},
  doi          = {10.21437/INTERSPEECH.2008-308},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/PoveyK08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PoveyK08a,
  author       = {Povey, Daniel and
                  Kuo, Hong{-}Kwang Jeff},
  title        = {{XMLLR} for improved speaker adaptation in speech recognition},
  booktitle    = {9th Annual Conference of the International Speech Communication Association,
                  {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages        = {1705--1708},
  publisher    = {{ISCA}},
  year         = {2008},
  url          = {https://doi.org/10.21437/Interspeech.2008-380},
  doi          = {10.21437/INTERSPEECH.2008-380},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/PoveyK08a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyK07,
  author       = {Povey, Daniel and
                  Kingsbury, Brian},
  title        = {Evaluation of Proposed Modifications to {MPE} for Large Scale Discriminative
                  Training},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April
                  15-20, 2007},
  pages        = {321--324},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ICASSP.2007.366914},
  doi          = {10.1109/ICASSP.2007.366914},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyK07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SoltauSKKMPZ07,
  author       = {Hagen Soltau and
                  George Saon and
                  Brian Kingsbury and
                  Hong{-}Kwang Jeff Kuo and
                  Lidia Mangu and
                  Daniel Povey and
                  Geoffrey Zweig},
  title        = {The {IBM} 2006 {GALE} {Arabic} {ASR} System},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April
                  15-20, 2007},
  pages        = {349--352},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ICASSP.2007.366921},
  doi          = {10.1109/ICASSP.2007.366921},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SoltauSKKMPZ07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SarikayaZPAG07,
  author       = {Sarikaya, Ruhi and
                  Zhou, Bowen and
                  Povey, Daniel and
                  Afify, Mohamed and
                  Gao, Yuqing},
  title        = {The Impact of {ASR} on Speech-to-Speech Translation Performance},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April
                  15-20, 2007},
  pages        = {1289--1292},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ICASSP.2007.367313},
  doi          = {10.1109/ICASSP.2007.367313},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SarikayaZPAG07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/HainWEGLMPW06,
  author       = {Thomas Hain and
                  Philip C. Woodland and
                  Gunnar Evermann and
                  Mark J. F. Gales and
                  Xunying Liu and
                  Gareth L. Moore and
                  Daniel Povey and
                  Lan Wang},
  title        = {Corrections to ``Automatic Transcription of Conversational Telephone
                  Speech''},
  journal      = {{IEEE} Transactions on Audio, Speech, and Language Processing},
  volume       = {14},
  number       = {2},
  pages        = {727},
  year         = {2006},
  url          = {https://doi.org/10.1109/TASL.2006.871051},
  doi          = {10.1109/TASL.2006.871051},
  timestamp    = {Fri, 03 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/HainWEGLMPW06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/ChenKMPSSZ06,
  author       = {Stanley F. Chen and
                  Brian Kingsbury and
                  Lidia Mangu and
                  Daniel Povey and
                  George Saon and
                  Hagen Soltau and
                  Geoffrey Zweig},
  title        = {Advances in speech transcription at {IBM} under the {DARPA} {EARS}
                  program},
  journal      = {{IEEE} Transactions on Audio, Speech, and Language Processing},
  volume       = {14},
  number       = {5},
  pages        = {1596--1608},
  year         = {2006},
  url          = {https://doi.org/10.1109/TASL.2006.879814},
  doi          = {10.1109/TASL.2006.879814},
  timestamp    = {Sun, 17 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/ChenKMPSSZ06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PelecanosPR06,
  author       = {Pelecanos, Jason W. and
                  Povey, Daniel and
                  Ramaswamy, Ganesh N.},
  title        = {Secondary Classification for {GMM} Based Speaker Recognition},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal
                  Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {109--112},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1659969},
  doi          = {10.1109/ICASSP.2006.1659969},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PelecanosPR06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ZweigSSRPMK06,
  author       = {Zweig, Geoffrey and
                  Siohan, Olivier and
                  Saon, George and
                  Ramabhadran, Bhuvana and
                  Povey, Daniel and
                  Mangu, Lidia and
                  Kingsbury, Brian},
  title        = {Automated Quality Monitoring in the Call Center with {ASR} and Maximum
                  Entropy},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal
                  Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {589--592},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1660089},
  doi          = {10.1109/ICASSP.2006.1660089},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ZweigSSRPMK06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ChoueiterPCZ06,
  author       = {Ghinwa F. Choueiter and
                  Daniel Povey and
                  Stanley F. Chen and
                  Geoffrey Zweig},
  title        = {Morpheme-Based Language Modeling for {Arabic} {LVCSR}},
  booktitle    = {2006 {IEEE} International Conference on Acoustics Speech and Signal
                  Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages        = {1053--1056},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICASSP.2006.1660205},
  doi          = {10.1109/ICASSP.2006.1660205},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ChoueiterPCZ06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Povey06,
  author       = {Povey, Daniel},
  title        = {{SPAM} and full covariance for speech recognition},
  booktitle    = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP}
                  2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher    = {{ISCA}},
  year         = {2006},
  url          = {https://doi.org/10.21437/Interspeech.2006-437},
  doi          = {10.21437/INTERSPEECH.2006-437},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/Povey06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PoveyS06,
  author       = {Daniel Povey and
                  George Saon},
  title        = {Feature and model space speaker adaptation with full covariance {Gaussians}},
  booktitle    = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP}
                  2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher    = {{ISCA}},
  year         = {2006},
  url          = {https://doi.org/10.21437/Interspeech.2006-349},
  doi          = {10.21437/INTERSPEECH.2006-349},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/PoveyS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mlmi/HuangWCSPLSSRP06,
  author       = {Jing Huang and
                  Martin Westphal and
                  Stanley F. Chen and
                  Olivier Siohan and
                  Daniel Povey and
                  Vit Libal and
                  Alvaro Soneiro and
                  Henrik Schulz and
                  Thomas Ross and
                  Gerasimos Potamianos},
  editor       = {Steve Renals and
                  Samy Bengio and
                  Jonathan G. Fiscus},
  title        = {The {IBM} Rich Transcription Spring 2006 Speech-to-Text System for
                  Lecture Meetings},
  booktitle    = {Machine Learning for Multimodal Interaction, Third International Workshop,
                  {MLMI} 2006, Bethesda, MD, USA, May 1-4, 2006, Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {4299},
  pages        = {432--443},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/11965152_38},
  doi          = {10.1007/11965152_38},
  timestamp    = {Fri, 10 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/mlmi/HuangWCSPLSSRP06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/ZweigSSRPMK06,
  author       = {Zweig, Geoffrey and
                  Siohan, Olivier and
                  Saon, George and
                  Ramabhadran, Bhuvana and
                  Povey, Daniel and
                  Mangu, Lidia and
                  Kingsbury, Brian},
  editor       = {Moore, Robert C. and
                  Bilmes, Jeff A. and
                  Chu{-}Carroll, Jennifer and
                  Sanderson, Mark},
  title        = {Automated Quality Monitoring for Call Centers using Speech and {NLP}
                  Technologies},
  booktitle    = {Human Language Technology Conference of the North American Chapter
                  of the Association of Computational Linguistics, Proceedings, June
                  4-9, 2006, New York, New York, {USA}},
  publisher    = {The Association for Computational Linguistics},
  year         = {2006},
  url          = {https://aclanthology.org/N06-4011/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/ZweigSSRPMK06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/HainWEGLMPW05,
  author       = {Thomas Hain and
                  Philip C. Woodland and
                  Gunnar Evermann and
                  Mark J. F. Gales and
                  Xunying Liu and
                  Gareth L. Moore and
                  Daniel Povey and
                  Lan Wang},
  title        = {Automatic transcription of conversational telephone speech},
  journal      = {{IEEE} Transactions on Speech and Audio Processing},
  volume       = {13},
  number       = {6},
  pages        = {1173--1185},
  year         = {2005},
  url          = {https://doi.org/10.1109/TSA.2005.852999},
  doi          = {10.1109/TSA.2005.852999},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/HainWEGLMPW05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SoltauKMPSZ05,
  author       = {Soltau, Hagen and
                  Kingsbury, Brian and
                  Mangu, Lidia and
                  Povey, Daniel and
                  Saon, George and
                  Zweig, Geoffrey},
  title        = {The {IBM} 2004 Conversational Telephony System for Rich Transcription},
  booktitle    = {2005 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '05, Philadelphia, Pennsylvania, USA, March 18-23,
                  2005},
  pages        = {205--208},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/ICASSP.2005.1415086},
  doi          = {10.1109/ICASSP.2005.1415086},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SoltauKMPSZ05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyKMSSZ05,
  author       = {Daniel Povey and
                  Brian Kingsbury and
                  Lidia Mangu and
                  George Saon and
                  Hagen Soltau and
                  Geoffrey Zweig},
  title        = {{fMPE}: Discriminatively Trained Features for Speech Recognition},
  booktitle    = {2005 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '05, Philadelphia, Pennsylvania, USA, March 18-23,
                  2005},
  pages        = {961--964},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/ICASSP.2005.1415275},
  doi          = {10.1109/ICASSP.2005.1415275},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyKMSSZ05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonPZ05,
  author       = {Saon, George and
                  Povey, Daniel and
                  Zweig, Geoffrey},
  title        = {Anatomy of an extremely fast {LVCSR} decoder},
  booktitle    = {9th European Conference on Speech Communication and Technology, INTERSPEECH-Eurospeech
                  2005, Lisbon, Portugal, September 4-8, 2005},
  pages        = {549--552},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-338},
  doi          = {10.21437/INTERSPEECH.2005-338},
  timestamp    = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SaonPZ05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/HuangP05,
  author       = {Jing Huang and
                  Daniel Povey},
  title        = {Discriminatively trained features using {fMPE} for multi-stream audio-visual
                  speech recognition},
  booktitle    = {9th European Conference on Speech Communication and Technology, INTERSPEECH-Eurospeech
                  2005, Lisbon, Portugal, September 4-8, 2005},
  pages        = {777--780},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-361},
  doi          = {10.21437/INTERSPEECH.2005-361},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/HuangP05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Povey05,
  author       = {Daniel Povey},
  title        = {Improvements to {fMPE} for discriminative training of features},
  booktitle    = {9th European Conference on Speech Communication and Technology, INTERSPEECH-Eurospeech
                  2005, Lisbon, Portugal, September 4-8, 2005},
  pages        = {2977--2980},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-133},
  doi          = {10.21437/INTERSPEECH.2005-133},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/Povey05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonDP04,
  author       = {George Saon and
                  Satya Dharanipragada and
                  Daniel Povey},
  title        = {Feature space {Gaussianization}},
  booktitle    = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages        = {329--332},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://doi.org/10.1109/ICASSP.2004.1325989},
  doi          = {10.1109/ICASSP.2004.1325989},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SaonDP04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/Povey04,
  author       = {Povey, Daniel},
  title        = {Phone duration modeling for {LVCSR}},
  booktitle    = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages        = {829--832},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://doi.org/10.1109/ICASSP.2004.1326114},
  doi          = {10.1109/ICASSP.2004.1326114},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/Povey04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyWG03,
  author       = {Daniel Povey and
                  Philip C. Woodland and
                  Mark J. F. Gales},
  title        = {Discriminative {MAP} for acoustic model adaptation},
  booktitle    = {2003 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '03, Hong Kong, April 6-10, 2003},
  pages        = {312--315},
  publisher    = {{IEEE}},
  year         = {2003},
  url          = {https://doi.org/10.1109/ICASSP.2003.1198780},
  doi          = {10.1109/ICASSP.2003.1198780},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyWG03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/GalesDPW03,
  author       = {Mark J. F. Gales and
                  Yuan Dong and
                  Daniel Povey and
                  Philip C. Woodland},
  title        = {Porting: {SwitchBoard} to the {VoiceMail} task},
  booktitle    = {2003 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '03, Hong Kong, April 6-10, 2003},
  pages        = {536--539},
  publisher    = {{IEEE}},
  year         = {2003},
  url          = {https://doi.org/10.1109/ICASSP.2003.1198836},
  doi          = {10.1109/ICASSP.2003.1198836},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/GalesDPW03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdar/NopsuwanchaiP03,
  author       = {Roongroj Nopsuwanchai and
                  Daniel Povey},
  title        = {Discriminative Training for {HMM}-Based Offline Handwritten Character
                  Recognition},
  booktitle    = {7th International Conference on Document Analysis and Recognition
                  {(ICDAR} 2003), 2-Volume Set, 3-6 August 2003, Edinburgh, Scotland,
                  {UK}},
  pages        = {114--118},
  publisher    = {{IEEE} Computer Society},
  year         = {2003},
  url          = {https://doi.org/10.1109/ICDAR.2003.1227643},
  doi          = {10.1109/ICDAR.2003.1227643},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icdar/NopsuwanchaiP03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PoveyGKW03,
  author       = {Povey, Daniel and
                  Gales, Mark J. F. and
                  Kim, Do Yeong and
                  Woodland, Philip C.},
  title        = {{MMI-MAP} and {MPE-MAP} for acoustic model adaptation},
  booktitle    = {8th European Conference on Speech Communication and Technology, {EUROSPEECH}
                  2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages        = {1981--1984},
  publisher    = {{ISCA}},
  year         = {2003},
  url          = {https://doi.org/10.21437/Eurospeech.2003-572},
  doi          = {10.21437/EUROSPEECH.2003-572},
  timestamp    = {Thu, 22 Jun 2023 16:42:17 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/PoveyGKW03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/WoodlandP02,
  author       = {Philip C. Woodland and
                  Daniel Povey},
  title        = {Large scale discriminative training of hidden {Markov} models for speech
                  recognition},
  journal      = {Computer Speech {\&} Language},
  volume       = {16},
  number       = {1},
  pages        = {25--47},
  year         = {2002},
  url          = {https://doi.org/10.1006/csla.2001.0182},
  doi          = {10.1006/CSLA.2001.0182},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csl/WoodlandP02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "I-smoothing" is braced so sentence-casing styles do not lowercase its capital I.
@inproceedings{DBLP:conf/icassp/PoveyW02,
  author       = {Daniel Povey and
                  Philip C. Woodland},
  title        = {Minimum Phone Error and {I-smoothing} for improved discriminative training},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2002, May 13-17 2002, Orlando, Florida,
                  {USA}},
  pages        = {105--108},
  publisher    = {{IEEE}},
  year         = {2002},
  url          = {https://doi.org/10.1109/ICASSP.2002.5743665},
  doi          = {10.1109/ICASSP.2002.5743665},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyW02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The country acronym in booktitle is braced like the other acronyms, so it survives any recasing.
@inproceedings{DBLP:conf/icassp/PoveyW01,
  author       = {Daniel Povey and
                  Philip C. Woodland},
  title        = {Improved discriminative training techniques for large vocabulary continuous
                  speech recognition},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing,
                  {ICASSP} 2001, 7-11 May, 2001, Salt Palace Convention Center, Salt
                  Lake City, Utah, {USA}, Proceedings},
  pages        = {45--48},
  publisher    = {{IEEE}},
  year         = {2001},
  url          = {https://doi.org/10.1109/ICASSP.2001.940763},
  doi          = {10.1109/ICASSP.2001.940763},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyW01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The country acronym in booktitle is braced like the other acronyms, so it survives any recasing.
@inproceedings{DBLP:conf/icassp/HainWEP01,
  author       = {Thomas Hain and
                  Philip C. Woodland and
                  Gunnar Evermann and
                  Daniel Povey},
  title        = {New features in the {CU-HTK} system for transcription of conversational
                  telephone speech},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing,
                  {ICASSP} 2001, 7-11 May, 2001, Salt Palace Convention Center, Salt
                  Lake City, Utah, {USA}, Proceedings},
  pages        = {57--60},
  publisher    = {{IEEE}},
  year         = {2001},
  url          = {https://doi.org/10.1109/ICASSP.2001.940766},
  doi          = {10.1109/ICASSP.2001.940766},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/HainWEP01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "HMMs" is an acronym; the braces stop sentence-casing styles from rendering it as "hmms".
% The country acronym in booktitle is braced like the other acronyms there.
@inproceedings{DBLP:conf/icassp/PoveyW99,
  author       = {Daniel Povey and
                  Philip C. Woodland},
  title        = {Frame discrimination training for {HMMs} for large vocabulary speech
                  recognition},
  booktitle    = {Proceedings of the 1999 {IEEE} International Conference on Acoustics,
                  Speech, and Signal Processing, {ICASSP} '99, Phoenix, Arizona, {USA},
                  March 15-19, 1999},
  pages        = {333--336},
  publisher    = {{IEEE} Computer Society},
  year         = {1999},
  url          = {https://doi.org/10.1109/ICASSP.1999.758130},
  doi          = {10.1109/ICASSP.1999.758130},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/PoveyW99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}