% BibTeX records for author George Saon (dblp export).
% ICASSP 2024 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2309-04031.
@inproceedings{DBLP:conf/icassp/UdagawaSKMS24,
  author    = {Takuma Udagawa and Masayuki Suzuki and Gakuto Kurata and Masayasu Muraoka and George Saon},
  title     = {Multiple Representation Transfer from Large Language Models to End-to-End {ASR} Systems},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2024, Seoul, Republic of Korea, April 14-19, 2024},
  pages     = {10176--10180},
  publisher = {{IEEE}},
  year      = {2024},
  url       = {https://doi.org/10.1109/ICASSP48485.2024.10448022},
  doi       = {10.1109/ICASSP48485.2024.10448022},
  timestamp = {Tue, 06 Aug 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/UdagawaSKMS24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2024 paper. Same authors and title (up to capitalisation) as the CoRR record DBLP:journals/corr/abs-2309-10926.
@inproceedings{DBLP:conf/icassp/AroraS0K24,
  author    = {Siddhant Arora and George Saon and Shinji Watanabe and Brian Kingsbury},
  title     = {Semi-Autoregressive Streaming {ASR} with Label Context},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2024, Seoul, Republic of Korea, April 14-19, 2024},
  pages     = {11681--11685},
  publisher = {{IEEE}},
  year      = {2024},
  url       = {https://doi.org/10.1109/ICASSP48485.2024.10446807},
  doi       = {10.1109/ICASSP48485.2024.10446807},
  timestamp = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/AroraS0K24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2402.00235.
@article{DBLP:journals/corr/abs-2402-00235,
  author     = {Ankit Gupta and George Saon and Brian Kingsbury},
  title      = {Exploring the limits of decoder-only models trained on public speech recognition corpora},
  journal    = {CoRR},
  volume     = {abs/2402.00235},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.00235},
  doi        = {10.48550/ARXIV.2402.00235},
  eprinttype = {arXiv},
  eprint     = {2402.00235},
  timestamp  = {Fri, 09 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-00235.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2023 paper.
@inproceedings{DBLP:conf/emnlp/MittalSJSK23,
  author    = {Ashish R. Mittal and Sunita Sarawagi and Preethi Jyothi and George Saon and Gakuto Kurata},
  editor    = {Houda Bouamor and Juan Pino and Kalika Bali},
  title     = {Speech-enriched Memory for Inference-time Adaptation of {ASR} Models to Word Dictionaries},
  booktitle = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages     = {14820--14835},
  publisher = {Association for Computational Linguistics},
  year      = {2023},
  url       = {https://doi.org/10.18653/v1/2023.emnlp-main.916},
  doi       = {10.18653/V1/2023.EMNLP-MAIN.916},
  timestamp = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/emnlp/MittalSJSK23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2023 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2302-14120.
@inproceedings{DBLP:conf/icassp/SaonGC23,
  author    = {George Saon and Ankit Gupta and Xiaodong Cui},
  title     = {Diagonal State Space Augmented Transformers for Speech Recognition},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages     = {1--5},
  publisher = {{IEEE}},
  year      = {2023},
  url       = {https://doi.org/10.1109/ICASSP49357.2023.10096271},
  doi       = {10.1109/ICASSP49357.2023.10096271},
  timestamp = {Sun, 05 Nov 2023 16:51:21 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/SaonGC23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2023 paper.
@inproceedings{DBLP:conf/icassp/ThomasKSK23,
  author    = {Samuel Thomas and Hong{-}Kwang Jeff Kuo and George Saon and Brian Kingsbury},
  title     = {Multi-Speaker Data Augmentation for Improved end-to-end Automatic Speech Recognition},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages     = {1--5},
  publisher = {{IEEE}},
  year      = {2023},
  url       = {https://doi.org/10.1109/ICASSP49357.2023.10095622},
  doi       = {10.1109/ICASSP49357.2023.10095622},
  timestamp = {Sun, 05 Nov 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/ThomasKSK23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2023 paper.
% The proper noun "English" in the title is brace-protected so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/interspeech/CuiSK23,
  author    = {Xiaodong Cui and George Saon and Brian Kingsbury},
  editor    = {Naomi Harte and Julie Carson{-}Berndsen and Gareth Jones},
  title     = {Improving {RNN} Transducer Acoustic Models for {English} Conversational Speech Recognition},
  booktitle = {24th Annual Conference of the International Speech Communication Association, Interspeech 2023, Dublin, Ireland, August 20-24, 2023},
  pages     = {1299--1303},
  publisher = {{ISCA}},
  year      = {2023},
  url       = {https://doi.org/10.21437/Interspeech.2023-2207},
  doi       = {10.21437/INTERSPEECH.2023-2207},
  timestamp = {Fri, 14 Jun 2024 14:12:12 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/CuiSK23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2302.14120. Same authors and title as the ICASSP 2023 record DBLP:conf/icassp/SaonGC23.
@article{DBLP:journals/corr/abs-2302-14120,
  author     = {George Saon and Ankit Gupta and Xiaodong Cui},
  title      = {Diagonal State Space Augmented Transformers for Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/2302.14120},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.14120},
  doi        = {10.48550/ARXIV.2302.14120},
  eprinttype = {arXiv},
  eprint     = {2302.14120},
  timestamp  = {Tue, 18 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-14120.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2309.04031. Same authors and title as the ICASSP 2024 record DBLP:conf/icassp/UdagawaSKMS24.
@article{DBLP:journals/corr/abs-2309-04031,
  author     = {Takuma Udagawa and Masayuki Suzuki and Gakuto Kurata and Masayasu Muraoka and George Saon},
  title      = {Multiple Representation Transfer from Large Language Models to End-to-End {ASR} Systems},
  journal    = {CoRR},
  volume     = {abs/2309.04031},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.04031},
  doi        = {10.48550/ARXIV.2309.04031},
  eprinttype = {arXiv},
  eprint     = {2309.04031},
  timestamp  = {Tue, 12 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-04031.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2309.10926. Same authors and title (up to capitalisation) as the ICASSP 2024 record DBLP:conf/icassp/AroraS0K24.
@article{DBLP:journals/corr/abs-2309-10926,
  author     = {Siddhant Arora and George Saon and Shinji Watanabe and Brian Kingsbury},
  title      = {Semi-Autoregressive Streaming {ASR} With Label Context},
  journal    = {CoRR},
  volume     = {abs/2309.10926},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.10926},
  doi        = {10.48550/ARXIV.2309.10926},
  eprinttype = {arXiv},
  eprint     = {2309.10926},
  timestamp  = {Mon, 25 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-10926.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2311.12727.
@article{DBLP:journals/corr/abs-2311-12727,
  author     = {Xiaodong Cui and Ashish R. Mittal and Songtao Lu and Wei Zhang and George Saon and Brian Kingsbury},
  title      = {Soft Random Sampling: {A} Theoretical and Empirical Analysis},
  journal    = {CoRR},
  volume     = {abs/2311.12727},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.12727},
  doi        = {10.48550/ARXIV.2311.12727},
  eprinttype = {arXiv},
  eprint     = {2311.12727},
  timestamp  = {Thu, 30 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-12727.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2022 paper.
% NOTE(review): DBLP:journals/corr/abs-2110-02743 has the same author list but a
% different title; possibly the preprint of this paper -- confirm before merging.
@inproceedings{DBLP:conf/icassp/BohnstinglGWSEP22,
  author    = {Thomas Bohnstingl and Ayush Garg and Stanislaw Wozniak and George Saon and Evangelos Eleftheriou and Angeliki Pantazi},
  title     = {Speech Recognition Using Biologically-Inspired Neural Networks},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages     = {6992--6996},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.1109/ICASSP43922.2022.9747499},
  doi       = {10.1109/ICASSP43922.2022.9747499},
  timestamp = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/BohnstinglGWSEP22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2022 paper. Same authors and title (up to capitalisation) as the CoRR record DBLP:journals/corr/abs-2201-12105.
@inproceedings{DBLP:conf/icassp/KuoTTKS22,
  author    = {Hong{-}Kwang Jeff Kuo and Zolt{\'{a}}n T{\"{u}}ske and Samuel Thomas and Brian Kingsbury and George Saon},
  title     = {Improving End-to-end Models for Set Prediction in Spoken Language Understanding},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages     = {7162--7166},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.1109/ICASSP43922.2022.9746086},
  doi       = {10.1109/ICASSP43922.2022.9746086},
  timestamp = {Tue, 07 Jun 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/KuoTTKS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2022 paper. Same authors and title (up to capitalisation) as the CoRR record DBLP:journals/corr/abs-2203-00006.
@inproceedings{DBLP:conf/icassp/ThomasKKS22,
  author    = {Samuel Thomas and Hong{-}Kwang Jeff Kuo and Brian Kingsbury and George Saon},
  title     = {Towards Reducing the Need for Speech Training Data to Build Spoken Language Understanding Systems},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages     = {7932--7936},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.1109/ICASSP43922.2022.9747555},
  doi       = {10.1109/ICASSP43922.2022.9747555},
  timestamp = {Tue, 07 Jun 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/ThomasKKS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2022 paper. Same authors and title (up to capitalisation) as the CoRR record DBLP:journals/corr/abs-2202-13155.
@inproceedings{DBLP:conf/icassp/ThomasKSK22,
  author    = {Samuel Thomas and Brian Kingsbury and George Saon and Hong{-}Kwang Jeff Kuo},
  title     = {Integrating Text Inputs for Training and Adapting {RNN} Transducer {ASR} Models},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages     = {8127--8131},
  publisher = {{IEEE}},
  year      = {2022},
  url       = {https://doi.org/10.1109/ICASSP43922.2022.9747862},
  doi       = {10.1109/ICASSP43922.2022.9747862},
  timestamp = {Tue, 07 Jun 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/ThomasKSK22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2022 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2207-13965.
% The acronym "RNN-T" in the title is brace-protected so that sentence-casing
% bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/interspeech/KonsAMDK0S22,
  author    = {Zvi Kons and Hagai Aronowitz and Edmilson da Silva Morais and Matheus Damasceno and Hong{-}Kwang Kuo and Samuel Thomas and George Saon},
  editor    = {Hanseok Ko and John H. L. Hansen},
  title     = {Extending {RNN-T}-based speech recognition systems with emotion and language classification},
  booktitle = {23rd Annual Conference of the International Speech Communication Association, Interspeech 2022, Incheon, Korea, September 18-22, 2022},
  pages     = {546--549},
  publisher = {{ISCA}},
  year      = {2022},
  url       = {https://doi.org/10.21437/Interspeech.2022-10480},
  doi       = {10.21437/INTERSPEECH.2022-10480},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/KonsAMDK0S22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2022 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2208-01818.
@inproceedings{DBLP:conf/interspeech/ShiSH0K22,
  author    = {Jiatong Shi and George Saon and David Haws and Shinji Watanabe and Brian Kingsbury},
  editor    = {Hanseok Ko and John H. L. Hansen},
  title     = {{VQ-T:} {RNN} Transducers using Vector-Quantized Prediction Network States},
  booktitle = {23rd Annual Conference of the International Speech Communication Association, Interspeech 2022, Incheon, Korea, September 18-22, 2022},
  pages     = {1656--1660},
  publisher = {{ISCA}},
  year      = {2022},
  url       = {https://doi.org/10.21437/Interspeech.2022-414},
  doi       = {10.21437/INTERSPEECH.2022-414},
  timestamp = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ShiSH0K22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2022 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2206-07882.
@inproceedings{DBLP:conf/interspeech/FasoliCSVSCKG22,
  author    = {Andrea Fasoli and Chia{-}Yu Chen and Mauricio J. Serrano and Swagath Venkataramani and George Saon and Xiaodong Cui and Brian Kingsbury and Kailash Gopalakrishnan},
  editor    = {Hanseok Ko and John H. L. Hansen},
  title     = {Accelerating Inference and Language Model Fusion of Recurrent Neural Network Transducers via End-to-End 4-bit Quantization},
  booktitle = {23rd Annual Conference of the International Speech Communication Association, Interspeech 2022, Incheon, Korea, September 18-22, 2022},
  pages     = {2038--2042},
  publisher = {{ISCA}},
  year      = {2022},
  url       = {https://doi.org/10.21437/Interspeech.2022-413},
  doi       = {10.21437/INTERSPEECH.2022-413},
  timestamp = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/FasoliCSVSCKG22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2022 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2203-15176.
% "N-best" in the title is brace-protected so that sentence-casing bibliography
% styles do not turn it into "n-best".
@inproceedings{DBLP:conf/interspeech/CuiSNSFKK22,
  author    = {Xiaodong Cui and George Saon and Tohru Nagano and Masayuki Suzuki and Takashi Fukuda and Brian Kingsbury and Gakuto Kurata},
  editor    = {Hanseok Ko and John H. L. Hansen},
  title     = {Improving Generalization of Deep Neural Network Acoustic Models with Length Perturbation and {N-best} Based Label Smoothing},
  booktitle = {23rd Annual Conference of the International Speech Communication Association, Interspeech 2022, Incheon, Korea, September 18-22, 2022},
  pages     = {2638--2642},
  publisher = {{ISCA}},
  year      = {2022},
  url       = {https://doi.org/10.21437/Interspeech.2022-821},
  doi       = {10.21437/INTERSPEECH.2022-821},
  timestamp = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/CuiSNSFKK22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2022 paper.
@inproceedings{DBLP:conf/interspeech/Fukuda0SKSK22,
  author    = {Takashi Fukuda and Samuel Thomas and Masayuki Suzuki and Gakuto Kurata and George Saon and Brian Kingsbury},
  editor    = {Hanseok Ko and John H. L. Hansen},
  title     = {Global {RNN} Transducer Models For Multi-dialect Speech Recognition},
  booktitle = {23rd Annual Conference of the International Speech Communication Association, Interspeech 2022, Incheon, Korea, September 18-22, 2022},
  pages     = {3138--3142},
  publisher = {{ISCA}},
  year      = {2022},
  url       = {https://doi.org/10.21437/Interspeech.2022-165},
  doi       = {10.21437/INTERSPEECH.2022-165},
  timestamp = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/Fukuda0SKSK22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2022 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2204-00212.
@inproceedings{DBLP:conf/interspeech/UdagawaSKIS22,
  author    = {Takuma Udagawa and Masayuki Suzuki and Gakuto Kurata and Nobuyasu Itoh and George Saon},
  editor    = {Hanseok Ko and John H. L. Hansen},
  title     = {Effect and Analysis of Large-scale Language Model Rescoring on Competitive {ASR} Systems},
  booktitle = {23rd Annual Conference of the International Speech Communication Association, Interspeech 2022, Incheon, Korea, September 18-22, 2022},
  pages     = {3919--3923},
  publisher = {{ISCA}},
  year      = {2022},
  url       = {https://doi.org/10.21437/Interspeech.2022-11123},
  doi       = {10.21437/INTERSPEECH.2022-11123},
  timestamp = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/UdagawaSKIS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2201.12105. Same authors and title (up to capitalisation) as the ICASSP 2022 record DBLP:conf/icassp/KuoTTKS22.
@article{DBLP:journals/corr/abs-2201-12105,
  author     = {Hong{-}Kwang Jeff Kuo and Zolt{\'{a}}n T{\"{u}}ske and Samuel Thomas and Brian Kingsbury and George Saon},
  title      = {Improving End-to-End Models for Set Prediction in Spoken Language Understanding},
  journal    = {CoRR},
  volume     = {abs/2201.12105},
  year       = {2022},
  url        = {https://arxiv.org/abs/2201.12105},
  eprinttype = {arXiv},
  eprint     = {2201.12105},
  timestamp  = {Wed, 02 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2201-12105.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2202.13155. Same authors and title (up to capitalisation) as the ICASSP 2022 record DBLP:conf/icassp/ThomasKSK22.
@article{DBLP:journals/corr/abs-2202-13155,
  author     = {Samuel Thomas and Brian Kingsbury and George Saon and Hong{-}Kwang Jeff Kuo},
  title      = {Integrating Text Inputs For Training and Adapting {RNN} Transducer {ASR} Models},
  journal    = {CoRR},
  volume     = {abs/2202.13155},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.13155},
  eprinttype = {arXiv},
  eprint     = {2202.13155},
  timestamp  = {Wed, 02 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-13155.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2203.00006. Same authors and title (up to capitalisation) as the ICASSP 2022 record DBLP:conf/icassp/ThomasKKS22.
@article{DBLP:journals/corr/abs-2203-00006,
  author     = {Samuel Thomas and Hong{-}Kwang Jeff Kuo and Brian Kingsbury and George Saon},
  title      = {Towards Reducing the Need for Speech Training Data To Build Spoken Language Understanding Systems},
  journal    = {CoRR},
  volume     = {abs/2203.00006},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.00006},
  doi        = {10.48550/ARXIV.2203.00006},
  eprinttype = {arXiv},
  eprint     = {2203.00006},
  timestamp  = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-00006.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2203.15176. Same authors and title as the Interspeech 2022 record DBLP:conf/interspeech/CuiSNSFKK22.
% "N-best" in the title is brace-protected so that sentence-casing bibliography
% styles do not turn it into "n-best".
@article{DBLP:journals/corr/abs-2203-15176,
  author     = {Xiaodong Cui and George Saon and Tohru Nagano and Masayuki Suzuki and Takashi Fukuda and Brian Kingsbury and Gakuto Kurata},
  title      = {Improving Generalization of Deep Neural Network Acoustic Models with Length Perturbation and {N-best} Based Label Smoothing},
  journal    = {CoRR},
  volume     = {abs/2203.15176},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.15176},
  doi        = {10.48550/ARXIV.2203.15176},
  eprinttype = {arXiv},
  eprint     = {2203.15176},
  timestamp  = {Mon, 04 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-15176.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2204.00212. Same authors and title as the Interspeech 2022 record DBLP:conf/interspeech/UdagawaSKIS22.
@article{DBLP:journals/corr/abs-2204-00212,
  author     = {Takuma Udagawa and Masayuki Suzuki and Gakuto Kurata and Nobuyasu Itoh and George Saon},
  title      = {Effect and Analysis of Large-scale Language Model Rescoring on Competitive {ASR} Systems},
  journal    = {CoRR},
  volume     = {abs/2204.00212},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.00212},
  doi        = {10.48550/ARXIV.2204.00212},
  eprinttype = {arXiv},
  eprint     = {2204.00212},
  timestamp  = {Wed, 06 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-00212.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2206.07882. Same authors and title as the Interspeech 2022 record DBLP:conf/interspeech/FasoliCSVSCKG22.
@article{DBLP:journals/corr/abs-2206-07882,
  author     = {Andrea Fasoli and Chia{-}Yu Chen and Mauricio J. Serrano and Swagath Venkataramani and George Saon and Xiaodong Cui and Brian Kingsbury and Kailash Gopalakrishnan},
  title      = {Accelerating Inference and Language Model Fusion of Recurrent Neural Network Transducers via End-to-End 4-bit Quantization},
  journal    = {CoRR},
  volume     = {abs/2206.07882},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.07882},
  doi        = {10.48550/ARXIV.2206.07882},
  eprinttype = {arXiv},
  eprint     = {2206.07882},
  timestamp  = {Tue, 21 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-07882.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2207.13965. Same authors and title as the Interspeech 2022 record DBLP:conf/interspeech/KonsAMDK0S22.
% The acronym "RNN-T" in the title is brace-protected so that sentence-casing
% bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2207-13965,
  author     = {Zvi Kons and Hagai Aronowitz and Edmilson da Silva Morais and Matheus Damasceno and Hong{-}Kwang Kuo and Samuel Thomas and George Saon},
  title      = {Extending {RNN-T}-based speech recognition systems with emotion and language classification},
  journal    = {CoRR},
  volume     = {abs/2207.13965},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.13965},
  doi        = {10.48550/ARXIV.2207.13965},
  eprinttype = {arXiv},
  eprint     = {2207.13965},
  timestamp  = {Tue, 02 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-13965.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2208.01818. Same authors and title as the Interspeech 2022 record DBLP:conf/interspeech/ShiSH0K22.
@article{DBLP:journals/corr/abs-2208-01818,
  author     = {Jiatong Shi and George Saon and David Haws and Shinji Watanabe and Brian Kingsbury},
  title      = {{VQ-T:} {RNN} Transducers using Vector-Quantized Prediction Network States},
  journal    = {CoRR},
  volume     = {abs/2208.01818},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.01818},
  doi        = {10.48550/ARXIV.2208.01818},
  eprinttype = {arXiv},
  eprint     = {2208.01818},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-01818.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (volume 29, 2021). Same authors and title as the CoRR record DBLP:journals/corr/abs-2110-11199.
@article{DBLP:journals/taslp/CuiZKLFKSK21,
  author    = {Xiaodong Cui and Wei Zhang and Abdullah Kayi and Mingrui Liu and Ulrich Finkler and Brian Kingsbury and George Saon and David S. Kung},
  title     = {Asynchronous Decentralized Distributed Training of Acoustic Models},
  journal   = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume    = {29},
  pages     = {3565--3576},
  year      = {2021},
  url       = {https://doi.org/10.1109/TASLP.2021.3122349},
  doi       = {10.1109/TASLP.2021.3122349},
  timestamp = {Sat, 25 Dec 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/taslp/CuiZKLFKSK21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2021 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2103-09935.
@inproceedings{DBLP:conf/icassp/SaonTBK21,
  author    = {George Saon and Zolt{\'{a}}n T{\"{u}}ske and Daniel Bola{\~{n}}os and Brian Kingsbury},
  title     = {Advancing {RNN} Transducer Technology for Speech Recognition},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages     = {5654--5658},
  publisher = {{IEEE}},
  year      = {2021},
  url       = {https://doi.org/10.1109/ICASSP39728.2021.9414716},
  doi       = {10.1109/ICASSP39728.2021.9414716},
  timestamp = {Fri, 09 Jul 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/SaonTBK21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2021 paper. Same authors and title (up to capitalisation) as the CoRR record DBLP:journals/corr/abs-2104-03842.
@inproceedings{DBLP:conf/icassp/0001KSTKKKH21,
  author    = {Samuel Thomas and Hong{-}Kwang Jeff Kuo and George Saon and Zolt{\'{a}}n T{\"{u}}ske and Brian Kingsbury and Gakuto Kurata and Zvi Kons and Ron Hoory},
  title     = {{RNN} Transducer Models for Spoken Language Understanding},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  pages     = {7493--7497},
  publisher = {{IEEE}},
  year      = {2021},
  url       = {https://doi.org/10.1109/ICASSP39728.2021.9414029},
  doi       = {10.1109/ICASSP39728.2021.9414029},
  timestamp = {Fri, 09 Jul 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/0001KSTKKKH21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2021 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2108-08405.
@inproceedings{DBLP:conf/interspeech/Ganhotra0KJSTK21,
  author    = {Jatin Ganhotra and Samuel Thomas and Hong{-}Kwang Jeff Kuo and Sachindra Joshi and George Saon and Zolt{\'{a}}n T{\"{u}}ske and Brian Kingsbury},
  editor    = {Hynek Hermansky and Honza Cernock{\'{y}} and Luk{\'{a}}s Burget and Lori Lamel and Odette Scharenborg and Petr Motl{\'{\i}}cek},
  title     = {Integrating Dialog History into End-to-End Spoken Language Understanding Systems},
  booktitle = {22nd Annual Conference of the International Speech Communication Association, Interspeech 2021, Brno, Czechia, August 30 - September 3, 2021},
  pages     = {1254--1258},
  publisher = {{ISCA}},
  year      = {2021},
  url       = {https://doi.org/10.21437/Interspeech.2021-1460},
  doi       = {10.21437/INTERSPEECH.2021-1460},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/Ganhotra0KJSTK21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2021 paper. Same authors and title as the CoRR record DBLP:journals/corr/abs-2108-10803.
@inproceedings{DBLP:conf/interspeech/CuiKSHT21,
  author    = {Xiaodong Cui and Brian Kingsbury and George Saon and David Haws and Zolt{\'{a}}n T{\"{u}}ske},
  editor    = {Hynek Hermansky and Honza Cernock{\'{y}} and Luk{\'{a}}s Burget and Lori Lamel and Odette Scharenborg and Petr Motl{\'{\i}}cek},
  title     = {Reducing Exposure Bias in Training Recurrent Neural Network Transducers},
  booktitle = {22nd Annual Conference of the International Speech Communication Association, Interspeech 2021, Brno, Czechia, August 30 - September 3, 2021},
  pages     = {1802--1806},
  publisher = {{ISCA}},
  year      = {2021},
  url       = {https://doi.org/10.21437/Interspeech.2021-587},
  doi       = {10.21437/INTERSPEECH.2021-587},
  timestamp = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/CuiKSHT21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2021 paper.
@inproceedings{DBLP:conf/interspeech/KurataSKHT21,
  author    = {Gakuto Kurata and George Saon and Brian Kingsbury and David Haws and Zolt{\'{a}}n T{\"{u}}ske},
  editor    = {Hynek Hermansky and Honza Cernock{\'{y}} and Luk{\'{a}}s Burget and Lori Lamel and Odette Scharenborg and Petr Motl{\'{\i}}cek},
  title     = {Improving Customization of Neural Transducers by Mitigating Acoustic Mismatch of Synthesized Audio},
  booktitle = {22nd Annual Conference of the International Speech Communication Association, Interspeech 2021, Brno, Czechia, August 30 - September 3, 2021},
  pages     = {2027--2031},
  publisher = {{ISCA}},
  year      = {2021},
  url       = {https://doi.org/10.21437/Interspeech.2021-1656},
  doi       = {10.21437/INTERSPEECH.2021-1656},
  timestamp = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/KurataSKHT21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2021 paper. Same authors and title (up to capitalisation) as the CoRR record DBLP:journals/corr/abs-2105-00982.
% The proper noun "English" in the title is brace-protected so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/interspeech/TuskeSK21,
  author    = {Zolt{\'{a}}n T{\"{u}}ske and George Saon and Brian Kingsbury},
  editor    = {Hynek Hermansky and Honza Cernock{\'{y}} and Luk{\'{a}}s Burget and Lori Lamel and Odette Scharenborg and Petr Motl{\'{\i}}cek},
  title     = {On the Limit of {English} Conversational Speech Recognition},
  booktitle = {22nd Annual Conference of the International Speech Communication Association, Interspeech 2021, Brno, Czechia, August 30 - September 3, 2021},
  pages     = {2062--2066},
  publisher = {{ISCA}},
  year      = {2021},
  url       = {https://doi.org/10.21437/Interspeech.2021-211},
  doi       = {10.21437/INTERSPEECH.2021-211},
  timestamp = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/TuskeSK21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2021 paper. Same authors and title (up to capitalisation) as the CoRR record DBLP:journals/corr/abs-2108-12074.
% The acronym "LSTM" in the title is brace-protected so that sentence-casing
% bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/interspeech/FasoliCSSWVSCK021,
  author    = {Andrea Fasoli and Chia{-}Yu Chen and Mauricio J. Serrano and Xiao Sun and Naigang Wang and Swagath Venkataramani and George Saon and Xiaodong Cui and Brian Kingsbury and Wei Zhang and Zolt{\'{a}}n T{\"{u}}ske and Kailash Gopalakrishnan},
  editor    = {Hynek Hermansky and Honza Cernock{\'{y}} and Luk{\'{a}}s Burget and Lori Lamel and Odette Scharenborg and Petr Motl{\'{\i}}cek},
  title     = {4-Bit Quantization of {LSTM}-Based Speech Recognition Models},
  booktitle = {22nd Annual Conference of the International Speech Communication Association, Interspeech 2021, Brno, Czechia, August 30 - September 3, 2021},
  pages     = {2586--2590},
  publisher = {{ISCA}},
  year      = {2021},
  url       = {https://doi.org/10.21437/Interspeech.2021-1962},
  doi       = {10.21437/INTERSPEECH.2021-1962},
  timestamp = {Sat, 19 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/FasoliCSSWVSCK021.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2103.09935. Same authors and title as the ICASSP 2021 record DBLP:conf/icassp/SaonTBK21.
@article{DBLP:journals/corr/abs-2103-09935,
  author     = {George Saon and Zolt{\'{a}}n T{\"{u}}ske and Daniel Bola{\~{n}}os and Brian Kingsbury},
  title      = {Advancing {RNN} Transducer Technology for Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/2103.09935},
  year       = {2021},
  url        = {https://arxiv.org/abs/2103.09935},
  eprinttype = {arXiv},
  eprint     = {2103.09935},
  timestamp  = {Tue, 23 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-09935.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2104.03842. Same authors and title (up to capitalisation) as the ICASSP 2021 record DBLP:conf/icassp/0001KSTKKKH21.
@article{DBLP:journals/corr/abs-2104-03842,
  author     = {Samuel Thomas and Hong{-}Kwang Jeff Kuo and George Saon and Zolt{\'{a}}n T{\"{u}}ske and Brian Kingsbury and Gakuto Kurata and Zvi Kons and Ron Hoory},
  title      = {{RNN} Transducer Models For Spoken Language Understanding},
  journal    = {CoRR},
  volume     = {abs/2104.03842},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.03842},
  eprinttype = {arXiv},
  eprint     = {2104.03842},
  timestamp  = {Tue, 13 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-03842.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2105.00982. Same authors and title (up to capitalisation) as the Interspeech 2021 record DBLP:conf/interspeech/TuskeSK21.
% The proper noun "English" in the title is brace-protected so that
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2105-00982,
  author     = {Zolt{\'{a}}n T{\"{u}}ske and George Saon and Brian Kingsbury},
  title      = {On the limit of {English} conversational speech recognition},
  journal    = {CoRR},
  volume     = {abs/2105.00982},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.00982},
  eprinttype = {arXiv},
  eprint     = {2105.00982},
  timestamp  = {Wed, 12 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-00982.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2108.08405. Same authors and title as the Interspeech 2021 record DBLP:conf/interspeech/Ganhotra0KJSTK21.
@article{DBLP:journals/corr/abs-2108-08405,
  author     = {Jatin Ganhotra and Samuel Thomas and Hong{-}Kwang Jeff Kuo and Sachindra Joshi and George Saon and Zolt{\'{a}}n T{\"{u}}ske and Brian Kingsbury},
  title      = {Integrating Dialog History into End-to-End Spoken Language Understanding Systems},
  journal    = {CoRR},
  volume     = {abs/2108.08405},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.08405},
  eprinttype = {arXiv},
  eprint     = {2108.08405},
  timestamp  = {Mon, 23 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-08405.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2108.10803. Same authors and title as the Interspeech 2021 record DBLP:conf/interspeech/CuiKSHT21.
@article{DBLP:journals/corr/abs-2108-10803,
  author     = {Xiaodong Cui and Brian Kingsbury and George Saon and David Haws and Zolt{\'{a}}n T{\"{u}}ske},
  title      = {Reducing Exposure Bias in Training Recurrent Neural Network Transducers},
  journal    = {CoRR},
  volume     = {abs/2108.10803},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.10803},
  eprinttype = {arXiv},
  eprint     = {2108.10803},
  timestamp  = {Fri, 27 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-10803.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2108.12074. Same authors and title (up to capitalisation) as the Interspeech 2021 record DBLP:conf/interspeech/FasoliCSSWVSCK021.
% The acronym "LSTM" in the title is brace-protected so that sentence-casing
% bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2108-12074,
  author     = {Andrea Fasoli and Chia{-}Yu Chen and Mauricio J. Serrano and Xiao Sun and Naigang Wang and Swagath Venkataramani and George Saon and Xiaodong Cui and Brian Kingsbury and Wei Zhang and Zolt{\'{a}}n T{\"{u}}ske and Kailash Gopalakrishnan},
  title      = {4-bit Quantization of {LSTM}-based Speech Recognition Models},
  journal    = {CoRR},
  volume     = {abs/2108.12074},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.12074},
  eprinttype = {arXiv},
  eprint     = {2108.12074},
  timestamp  = {Tue, 14 Dec 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-12074.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2110.02743.
% NOTE(review): DBLP:conf/icassp/BohnstinglGWSEP22 has the same author list but a
% different title; possibly the published version of this preprint -- confirm.
@article{DBLP:journals/corr/abs-2110-02743,
  author     = {Thomas Bohnstingl and Ayush Garg and Stanislaw Wozniak and George Saon and Evangelos Eleftheriou and Angeliki Pantazi},
  title      = {Towards efficient end-to-end speech recognition with biologically-inspired neural networks},
  journal    = {CoRR},
  volume     = {abs/2110.02743},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.02743},
  eprinttype = {arXiv},
  eprint     = {2110.02743},
  timestamp  = {Fri, 05 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-02743.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv 2110.11199. Same authors and title as the journal record DBLP:journals/taslp/CuiZKLFKSK21.
@article{DBLP:journals/corr/abs-2110-11199,
  author     = {Xiaodong Cui and Wei Zhang and Abdullah Kayi and Mingrui Liu and Ulrich Finkler and Brian Kingsbury and George Saon and David S. Kung},
  title      = {Asynchronous Decentralized Distributed Training of Acoustic Models},
  journal    = {CoRR},
  volume     = {abs/2110.11199},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.11199},
  eprinttype = {arXiv},
  eprint     = {2110.11199},
  timestamp  = {Thu, 28 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-11199.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Magazine article (volume 37, number 3, 2020).
@article{DBLP:journals/spm/CuiZFSPK20,
  author    = {Xiaodong Cui and Wei Zhang and Ulrich Finkler and George Saon and Michael Picheny and David S. Kung},
  title     = {Distributed Training of Deep Neural Network Acoustic Models for Automatic Speech Recognition: {A} comparison of current training strategies},
  journal   = {{IEEE} Signal Process. Mag.},
  volume    = {37},
  number    = {3},
  pages     = {39--49},
  year      = {2020},
  url       = {https://doi.org/10.1109/MSP.2020.2969859},
  doi       = {10.1109/MSP.2020.2969859},
  timestamp = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/spm/CuiZFSPK20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2020 paper.
% The CoRR record DBLP:journals/corr/abs-2002-01119 in this file has the same authors and title.
@inproceedings{DBLP:conf/icassp/ZhangCKLFKSMBDK20,
  author     = {Wei Zhang and Xiaodong Cui and Abdullah Kayi and Mingrui Liu and Ulrich Finkler and Brian Kingsbury and George Saon and Youssef Mroueh and Alper Buyuktosunoglu and Payel Das and David S. Kung and Michael Picheny},
  title      = {Improving Efficiency in Large-Scale Decentralized Distributed Training},
  booktitle  = {2020 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages      = {3022--3026},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/ICASSP40776.2020.9054065},
  doi        = {10.1109/ICASSP40776.2020.9054065},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ZhangCKLFKSMBDK20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 paper.
@inproceedings{DBLP:conf/icassp/SaonTA20,
  author     = {George Saon and Zolt{\'{a}}n T{\"{u}}ske and Kartik Audhkhasi},
  title      = {Alignment-Length Synchronous Decoding for {RNN} Transducer},
  booktitle  = {2020 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages      = {7804--7808},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/ICASSP40776.2020.9053040},
  doi        = {10.1109/ICASSP40776.2020.9053040},
  timestamp  = {Thu, 23 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SaonTA20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper.
% Switchboard (corpus name) is brace-protected in the title so sentence-casing styles keep its capital.
% The CoRR record DBLP:journals/corr/abs-2001-07263 in this file lists the same authors and a near-identical title.
@inproceedings{DBLP:conf/interspeech/TuskeSAK20,
  author     = {Zolt{\'{a}}n T{\"{u}}ske and George Saon and Kartik Audhkhasi and Brian Kingsbury},
  editor     = {Helen Meng and Bo Xu and Thomas Fang Zheng},
  title      = {Single Headed Attention Based Sequence-to-Sequence Model for State-of-the-Art Results on {Switchboard}},
  booktitle  = {21st Annual Conference of the International Speech Communication Association, Interspeech 2020, Virtual Event, Shanghai, China, October 25-29, 2020},
  pages      = {551--555},
  publisher  = {{ISCA}},
  year       = {2020},
  url        = {https://doi.org/10.21437/Interspeech.2020-1488},
  doi        = {10.21437/INTERSPEECH.2020-1488},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/TuskeSAK20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 paper.
@inproceedings{DBLP:conf/interspeech/KurataS20,
  author     = {Gakuto Kurata and George Saon},
  editor     = {Helen Meng and Bo Xu and Thomas Fang Zheng},
  title      = {Knowledge Distillation from Offline to Streaming {RNN} Transducer for End-to-End Speech Recognition},
  booktitle  = {21st Annual Conference of the International Speech Communication Association, Interspeech 2020, Virtual Event, Shanghai, China, October 25-29, 2020},
  pages      = {2117--2121},
  publisher  = {{ISCA}},
  year       = {2020},
  url        = {https://doi.org/10.21437/Interspeech.2020-2442},
  doi        = {10.21437/INTERSPEECH.2020-2442},
  timestamp  = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/interspeech/KurataS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/2001.07263.
% Switchboard (corpus name) is brace-protected in the title so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-2001-07263,
  author     = {Zolt{\'{a}}n T{\"{u}}ske and George Saon and Kartik Audhkhasi and Brian Kingsbury},
  title      = {Single headed attention based sequence-to-sequence model for state-of-the-art results on {Switchboard}-300},
  journal    = {CoRR},
  volume     = {abs/2001.07263},
  year       = {2020},
  url        = {https://arxiv.org/abs/2001.07263},
  eprinttype = {arXiv},
  eprint     = {2001.07263},
  timestamp  = {Fri, 24 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2001-07263.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/2002.01119.
% The ICASSP 2020 record DBLP:conf/icassp/ZhangCKLFKSMBDK20 in this file has the same authors and title.
@article{DBLP:journals/corr/abs-2002-01119,
  author     = {Wei Zhang and Xiaodong Cui and Abdullah Kayi and Mingrui Liu and Ulrich Finkler and Brian Kingsbury and George Saon and Youssef Mroueh and Alper Buyuktosunoglu and Payel Das and David S. Kung and Michael Picheny},
  title      = {Improving Efficiency in Large-Scale Decentralized Distributed Training},
  journal    = {CoRR},
  volume     = {abs/2002.01119},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.01119},
  eprinttype = {arXiv},
  eprint     = {2002.01119},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-01119.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/2002.10502.
% The journal record DBLP:journals/spm/CuiZFSPK20 in this file lists the same authors and main title.
@article{DBLP:journals/corr/abs-2002-10502,
  author     = {Xiaodong Cui and Wei Zhang and Ulrich Finkler and George Saon and Michael Picheny and David S. Kung},
  title      = {Distributed Training of Deep Neural Network Acoustic Models for Automatic Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/2002.10502},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.10502},
  eprinttype = {arXiv},
  eprint     = {2002.10502},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-10502.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ASRU 2019 workshop paper.
@inproceedings{DBLP:conf/asru/SaonTAKPT19,
  author     = {George Saon and Zolt{\'{a}}n T{\"{u}}ske and Kartik Audhkhasi and Brian Kingsbury and Michael Picheny and Samuel Thomas},
  title      = {Simplified {LSTMS} for Speech Recognition},
  booktitle  = {{IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU} 2019, Singapore, December 14-18, 2019},
  pages      = {547--553},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ASRU46091.2019.9003898},
  doi        = {10.1109/ASRU46091.2019.9003898},
  timestamp  = {Fri, 03 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/SaonTAKPT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2019 paper.
% The CoRR record DBLP:journals/corr/abs-1904-04956 in this file has the same authors and title.
@inproceedings{DBLP:conf/icassp/ZhangCFKSKP19,
  author     = {Wei Zhang and Xiaodong Cui and Ulrich Finkler and Brian Kingsbury and George Saon and David S. Kung and Michael Picheny},
  title      = {Distributed Deep Learning Strategies for Automatic Speech Recognition},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages      = {5706--5710},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ICASSP.2019.8682888},
  doi        = {10.1109/ICASSP.2019.8682888},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ZhangCFKSKP19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2019 paper.
@inproceedings{DBLP:conf/icassp/SaonTAK19,
  author     = {George Saon and Zolt{\'{a}}n T{\"{u}}ske and Kartik Audhkhasi and Brian Kingsbury},
  title      = {Sequence Noise Injected Training for End-to-end Speech Recognition},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages      = {6261--6265},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ICASSP.2019.8683706},
  doi        = {10.1109/ICASSP.2019.8683706},
  timestamp  = {Sun, 30 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SaonTAK19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2019 paper.
% The CoRR record DBLP:journals/corr/abs-1904-13258 in this file has the same authors and title.
@inproceedings{DBLP:conf/icassp/ThomasSHKTSKPDK19,
  author     = {Samuel Thomas and Masayuki Suzuki and Yinghui Huang and Gakuto Kurata and Zolt{\'{a}}n T{\"{u}}ske and George Saon and Brian Kingsbury and Michael Picheny and Tom Dibert and Alice Kaiser{-}Schatzlein and Bern Samko},
  title      = {English Broadcast News Speech Recognition by Humans and Machines},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages      = {6455--6459},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/ICASSP.2019.8683211},
  doi        = {10.1109/ICASSP.2019.8683211},
  timestamp  = {Fri, 03 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ThomasSHKTSKPDK19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2019 paper.
% The CoRR record DBLP:journals/corr/abs-1908-03455 in this file has the same authors and title.
@inproceedings{DBLP:conf/interspeech/PichenyTKACS19,
  author     = {Michael Picheny and Zolt{\'{a}}n T{\"{u}}ske and Brian Kingsbury and Kartik Audhkhasi and Xiaodong Cui and George Saon},
  editor     = {Gernot Kubin and Zdravko Kacic},
  title      = {Challenging the Boundaries of Speech Recognition: The {MALACH} Corpus},
  booktitle  = {20th Annual Conference of the International Speech Communication Association, Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages      = {326--330},
  publisher  = {{ISCA}},
  year       = {2019},
  url        = {https://doi.org/10.21437/Interspeech.2019-1907},
  doi        = {10.21437/INTERSPEECH.2019-1907},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/PichenyTKACS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2019 paper.
% CTC is brace-protected in the title so sentence-casing styles keep the acronym in capitals.
@inproceedings{DBLP:conf/interspeech/AudhkhasiSTKP19,
  author     = {Kartik Audhkhasi and George Saon and Zolt{\'{a}}n T{\"{u}}ske and Brian Kingsbury and Michael Picheny},
  editor     = {Gernot Kubin and Zdravko Kacic},
  title      = {Forget a Bit to Learn Better: Soft Forgetting for {CTC}-Based Automatic Speech Recognition},
  booktitle  = {20th Annual Conference of the International Speech Communication Association, Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages      = {2618--2622},
  publisher  = {{ISCA}},
  year       = {2019},
  url        = {https://doi.org/10.21437/Interspeech.2019-2841},
  doi        = {10.21437/INTERSPEECH.2019-2841},
  timestamp  = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/interspeech/AudhkhasiSTKP19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2019 paper.
% The CoRR record DBLP:journals/corr/abs-1907-05701 in this file has the same authors and title.
@inproceedings{DBLP:conf/interspeech/ZhangCFSKBK0P19,
  author     = {Wei Zhang and Xiaodong Cui and Ulrich Finkler and George Saon and Abdullah Kayi and Alper Buyuktosunoglu and Brian Kingsbury and David S. Kung and Michael Picheny},
  editor     = {Gernot Kubin and Zdravko Kacic},
  title      = {A Highly Efficient Distributed Deep Learning System for Automatic Speech Recognition},
  booktitle  = {20th Annual Conference of the International Speech Communication Association, Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages      = {2628--2632},
  publisher  = {{ISCA}},
  year       = {2019},
  url        = {https://doi.org/10.21437/Interspeech.2019-2700},
  doi        = {10.21437/INTERSPEECH.2019-2700},
  timestamp  = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/interspeech/ZhangCFSKBK0P19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2019 paper.
@inproceedings{DBLP:conf/interspeech/TuskeAS19,
  author     = {Zolt{\'{a}}n T{\"{u}}ske and Kartik Audhkhasi and George Saon},
  editor     = {Gernot Kubin and Zdravko Kacic},
  title      = {Advancing Sequence-to-Sequence Based Speech Recognition},
  booktitle  = {20th Annual Conference of the International Speech Communication Association, Interspeech 2019, Graz, Austria, September 15-19, 2019},
  pages      = {3780--3784},
  publisher  = {{ISCA}},
  year       = {2019},
  url        = {https://doi.org/10.21437/Interspeech.2019-3018},
  doi        = {10.21437/INTERSPEECH.2019-3018},
  timestamp  = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/interspeech/TuskeAS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1904.04956.
% The url uses https, matching the newer arXiv records in this file.
% The ICASSP 2019 record DBLP:conf/icassp/ZhangCFKSKP19 in this file has the same authors and title.
@article{DBLP:journals/corr/abs-1904-04956,
  author     = {Wei Zhang and Xiaodong Cui and Ulrich Finkler and Brian Kingsbury and George Saon and David S. Kung and Michael Picheny},
  title      = {Distributed Deep Learning Strategies For Automatic Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/1904.04956},
  year       = {2019},
  url        = {https://arxiv.org/abs/1904.04956},
  eprinttype = {arXiv},
  eprint     = {1904.04956},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-04956.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1904.13258.
% The url uses https, matching the newer arXiv records in this file.
% The ICASSP 2019 record DBLP:conf/icassp/ThomasSHKTSKPDK19 in this file has the same authors and title.
@article{DBLP:journals/corr/abs-1904-13258,
  author     = {Samuel Thomas and Masayuki Suzuki and Yinghui Huang and Gakuto Kurata and Zolt{\'{a}}n T{\"{u}}ske and George Saon and Brian Kingsbury and Michael Picheny and Tom Dibert and Alice Kaiser{-}Schatzlein and Bern Samko},
  title      = {English Broadcast News Speech Recognition by Humans and Machines},
  journal    = {CoRR},
  volume     = {abs/1904.13258},
  year       = {2019},
  url        = {https://arxiv.org/abs/1904.13258},
  eprinttype = {arXiv},
  eprint     = {1904.13258},
  timestamp  = {Fri, 03 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-13258.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1907.05701.
% The url uses https, matching the newer arXiv records in this file.
% The Interspeech 2019 record DBLP:conf/interspeech/ZhangCFSKBK0P19 in this file has the same authors and title.
@article{DBLP:journals/corr/abs-1907-05701,
  author     = {Wei Zhang and Xiaodong Cui and Ulrich Finkler and George Saon and Abdullah Kayi and Alper Buyuktosunoglu and Brian Kingsbury and David S. Kung and Michael Picheny},
  title      = {A Highly Efficient Distributed Deep Learning System For Automatic Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/1907.05701},
  year       = {2019},
  url        = {https://arxiv.org/abs/1907.05701},
  eprinttype = {arXiv},
  eprint     = {1907.05701},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-05701.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1908.03455.
% The url uses https, matching the newer arXiv records in this file.
% The Interspeech 2019 record DBLP:conf/interspeech/PichenyTKACS19 in this file has the same authors and title.
@article{DBLP:journals/corr/abs-1908-03455,
  author     = {Michael Picheny and Zolt{\'{a}}n T{\"{u}}ske and Brian Kingsbury and Kartik Audhkhasi and Xiaodong Cui and George Saon},
  title      = {Challenging the Boundaries of Speech Recognition: The {MALACH} Corpus},
  journal    = {CoRR},
  volume     = {abs/1908.03455},
  year       = {2019},
  url        = {https://arxiv.org/abs/1908.03455},
  eprinttype = {arXiv},
  eprint     = {1908.03455},
  timestamp  = {Mon, 19 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1908-03455.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2018 paper.
% English is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
% The CoRR record DBLP:journals/corr/abs-1712-03133 in this file has the same authors and title wording.
@inproceedings{DBLP:conf/icassp/AudhkhasiKRSP18,
  author     = {Kartik Audhkhasi and Brian Kingsbury and Bhuvana Ramabhadran and George Saon and Michael Picheny},
  title      = {Building Competitive Direct Acoustics-to-Word Models for {English} Conversational Speech Recognition},
  booktitle  = {2018 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages      = {4759--4763},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.1109/ICASSP.2018.8461935},
  doi        = {10.1109/ICASSP.2018.8461935},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/AudhkhasiKRSP18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IBM Journal of Research and Development article, vol. 61 no. 4-5.
@article{DBLP:journals/ibmrd/SaonP17,
  author     = {George Saon and Michael Picheny},
  title      = {Recent advances in conversational speech recognition using convolutional and recurrent neural networks},
  journal    = {{IBM} J. Res. Dev.},
  volume     = {61},
  number     = {4-5},
  pages      = {1:1--1:10},
  year       = {2017},
  url        = {https://doi.org/10.1147/JRD.2017.2701178},
  doi        = {10.1147/JRD.2017.2701178},
  timestamp  = {Sun, 08 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ibmrd/SaonP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IBM Journal of Research and Development article, vol. 61 no. 4-5.
@article{DBLP:journals/ibmrd/AudhkhasiRSSRCP17,
  author     = {Kartik Audhkhasi and Andrew Rosenberg and George Saon and Abhinav Sethy and Bhuvana Ramabhadran and Stanley F. Chen and Michael Picheny},
  title      = {Recent progress in deep end-to-end models for spoken language processing},
  journal    = {{IBM} J. Res. Dev.},
  volume     = {61},
  number     = {4-5},
  pages      = {2:1--2:10},
  year       = {2017},
  url        = {https://doi.org/10.1147/JRD.2017.2701207},
  doi        = {10.1147/JRD.2017.2701207},
  timestamp  = {Sun, 08 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ibmrd/AudhkhasiRSSRCP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ASRU 2017 workshop paper.
% The CoRR record DBLP:journals/corr/abs-1709-06436 in this file has the same authors and title wording.
@inproceedings{DBLP:conf/asru/KurataRSS17,
  author     = {Gakuto Kurata and Bhuvana Ramabhadran and George Saon and Abhinav Sethy},
  title      = {Language modeling with highway {LSTM}},
  booktitle  = {2017 {IEEE} Automatic Speech Recognition and Understanding Workshop, {ASRU} 2017, Okinawa, Japan, December 16-20, 2017},
  pages      = {244--251},
  publisher  = {{IEEE}},
  year       = {2017},
  url        = {https://doi.org/10.1109/ASRU.2017.8268942},
  doi        = {10.1109/ASRU.2017.8268942},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/KurataRSS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2017 paper.
@inproceedings{DBLP:conf/icassp/CuiKRSSASNR17,
  author     = {Jia Cui and Brian Kingsbury and Bhuvana Ramabhadran and George Saon and Tom Sercu and Kartik Audhkhasi and Abhinav Sethy and Markus Nu{\ss}baum{-}Thom and Andrew Rosenberg},
  title      = {Knowledge distillation across ensembles of multilingual models for low-resource languages},
  booktitle  = {2017 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages      = {4825--4829},
  publisher  = {{IEEE}},
  year       = {2017},
  url        = {https://doi.org/10.1109/ICASSP.2017.7953073},
  doi        = {10.1109/ICASSP.2017.7953073},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/CuiKRSSASNR17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2017 paper.
@inproceedings{DBLP:conf/icassp/SercuSCCRKS17,
  author     = {Tom Sercu and George Saon and Jia Cui and Xiaodong Cui and Bhuvana Ramabhadran and Brian Kingsbury and Abhinav Sethy},
  title      = {Network architectures for multilingual speech representation learning},
  booktitle  = {2017 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages      = {5295--5299},
  publisher  = {{IEEE}},
  year       = {2017},
  url        = {https://doi.org/10.1109/ICASSP.2017.7953167},
  doi        = {10.1109/ICASSP.2017.7953167},
  timestamp  = {Fri, 23 Jun 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SercuSCCRKS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2017 paper.
% The CoRR record DBLP:journals/corr/abs-1710-06937 in this file has the same authors and title.
@inproceedings{DBLP:conf/interspeech/CuiGS17,
  author     = {Xiaodong Cui and Vaibhava Goel and George Saon},
  editor     = {Francisco Lacerda},
  title      = {Embedding-Based Speaker Adaptive Training of Deep Neural Networks},
  booktitle  = {18th Annual Conference of the International Speech Communication Association, Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages      = {122--126},
  publisher  = {{ISCA}},
  year       = {2017},
  url        = {https://doi.org/10.21437/Interspeech.2017-460},
  doi        = {10.21437/INTERSPEECH.2017-460},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/CuiGS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2017 paper.
% The CoRR record DBLP:journals/corr/SaonKSATDCRPLRH17 in this file has the same authors and title.
@inproceedings{DBLP:conf/interspeech/SaonKSATDCRPLRH17,
  author     = {George Saon and Gakuto Kurata and Tom Sercu and Kartik Audhkhasi and Samuel Thomas and Dimitrios Dimitriadis and Xiaodong Cui and Bhuvana Ramabhadran and Michael Picheny and Lynn{-}Li Lim and Bergul Roomi and Phil Hall},
  editor     = {Francisco Lacerda},
  title      = {English Conversational Telephone Speech Recognition by Humans and Machines},
  booktitle  = {18th Annual Conference of the International Speech Communication Association, Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages      = {132--136},
  publisher  = {{ISCA}},
  year       = {2017},
  url        = {https://doi.org/10.21437/Interspeech.2017-405},
  doi        = {10.21437/INTERSPEECH.2017-405},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SaonKSATDCRPLRH17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2017 paper.
@inproceedings{DBLP:conf/interspeech/KurataSRS17,
  author     = {Gakuto Kurata and Abhinav Sethy and Bhuvana Ramabhadran and George Saon},
  editor     = {Francisco Lacerda},
  title      = {Empirical Exploration of Novel Architectures and Objectives for Language Models},
  booktitle  = {18th Annual Conference of the International Speech Communication Association, Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages      = {279--283},
  publisher  = {{ISCA}},
  year       = {2017},
  url        = {https://doi.org/10.21437/Interspeech.2017-723},
  doi        = {10.21437/INTERSPEECH.2017-723},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/KurataSRS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2017 paper.
% English is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
% The CoRR record DBLP:journals/corr/AudhkhasiRSPN17 in this file has the same authors and title wording.
@inproceedings{DBLP:conf/interspeech/AudhkhasiRSPN17,
  author     = {Kartik Audhkhasi and Bhuvana Ramabhadran and George Saon and Michael Picheny and David Nahamoo},
  editor     = {Francisco Lacerda},
  title      = {Direct Acoustics-to-Word Models for {English} Conversational Speech Recognition},
  booktitle  = {18th Annual Conference of the International Speech Communication Association, Interspeech 2017, Stockholm, Sweden, August 20-24, 2017},
  pages      = {959--963},
  publisher  = {{ISCA}},
  year       = {2017},
  url        = {https://doi.org/10.21437/Interspeech.2017-546},
  doi        = {10.21437/INTERSPEECH.2017-546},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/AudhkhasiRSPN17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% MLHPC workshop at SC 2017.
% GPUs is brace-protected in the title so sentence-casing styles keep the acronym in capitals.
@inproceedings{DBLP:conf/sc/CongKGSZ17,
  author     = {Guojing Cong and Brian Kingsbury and Soumyadip Gosh and George Saon and Fan Zhou},
  title      = {Accelerating deep neural network learning for speech recognition on a cluster of {GPUs}},
  booktitle  = {Proceedings of the Machine Learning on {HPC} Environments, MLHPC@SC 2017, Denver, CO, USA, November 13, 2017},
  pages      = {3:1--3:8},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {https://doi.org/10.1145/3146347.3146351},
  doi        = {10.1145/3146347.3146351},
  timestamp  = {Tue, 13 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/sc/CongKGSZ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1703.02136.
% The url uses https, matching the newer arXiv records in this file.
% The Interspeech 2017 record DBLP:conf/interspeech/SaonKSATDCRPLRH17 in this file has the same authors and title.
@article{DBLP:journals/corr/SaonKSATDCRPLRH17,
  author     = {George Saon and Gakuto Kurata and Tom Sercu and Kartik Audhkhasi and Samuel Thomas and Dimitrios Dimitriadis and Xiaodong Cui and Bhuvana Ramabhadran and Michael Picheny and Lynn{-}Li Lim and Bergul Roomi and Phil Hall},
  title      = {English Conversational Telephone Speech Recognition by Humans and Machines},
  journal    = {CoRR},
  volume     = {abs/1703.02136},
  year       = {2017},
  url        = {https://arxiv.org/abs/1703.02136},
  eprinttype = {arXiv},
  eprint     = {1703.02136},
  timestamp  = {Fri, 03 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SaonKSATDCRPLRH17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1703.07754.
% English is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
% The url uses https, matching the newer arXiv records in this file.
% The Interspeech 2017 record DBLP:conf/interspeech/AudhkhasiRSPN17 in this file has the same authors and title wording.
@article{DBLP:journals/corr/AudhkhasiRSPN17,
  author     = {Kartik Audhkhasi and Bhuvana Ramabhadran and George Saon and Michael Picheny and David Nahamoo},
  title      = {Direct Acoustics-to-Word Models for {English} Conversational Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/1703.07754},
  year       = {2017},
  url        = {https://arxiv.org/abs/1703.07754},
  eprinttype = {arXiv},
  eprint     = {1703.07754},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/AudhkhasiRSPN17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1709.06436.
% The url uses https, matching the newer arXiv records in this file.
% The ASRU 2017 record DBLP:conf/asru/KurataRSS17 in this file has the same authors and title wording.
@article{DBLP:journals/corr/abs-1709-06436,
  author     = {Gakuto Kurata and Bhuvana Ramabhadran and George Saon and Abhinav Sethy},
  title      = {Language Modeling with Highway {LSTM}},
  journal    = {CoRR},
  volume     = {abs/1709.06436},
  year       = {2017},
  url        = {https://arxiv.org/abs/1709.06436},
  eprinttype = {arXiv},
  eprint     = {1709.06436},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-06436.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1710.06937.
% The url uses https, matching the newer arXiv records in this file.
% The Interspeech 2017 record DBLP:conf/interspeech/CuiGS17 in this file has the same authors and title.
@article{DBLP:journals/corr/abs-1710-06937,
  author     = {Xiaodong Cui and Vaibhava Goel and George Saon},
  title      = {Embedding-Based Speaker Adaptive Training of Deep Neural Networks},
  journal    = {CoRR},
  volume     = {abs/1710.06937},
  year       = {2017},
  url        = {https://arxiv.org/abs/1710.06937},
  eprinttype = {arXiv},
  eprint     = {1710.06937},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1710-06937.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1712.03133.
% English is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
% The url uses https, matching the newer arXiv records in this file.
% The ICASSP 2018 record DBLP:conf/icassp/AudhkhasiKRSP18 in this file has the same authors and title wording.
@article{DBLP:journals/corr/abs-1712-03133,
  author     = {Kartik Audhkhasi and Brian Kingsbury and Bhuvana Ramabhadran and George Saon and Michael Picheny},
  title      = {Building competitive direct acoustics-to-word models for {English} conversational speech recognition},
  journal    = {CoRR},
  volume     = {abs/1712.03133},
  year       = {2017},
  url        = {https://arxiv.org/abs/1712.03133},
  eprinttype = {arXiv},
  eprint     = {1712.03133},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1712-03133.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2016 paper.
@inproceedings{DBLP:conf/icassp/HawsDSTP16,
  author     = {David Haws and Dimitrios Dimitriadis and George Saon and Samuel Thomas and Michael Picheny},
  title      = {On the importance of event detection for {ASR}},
  booktitle  = {2016 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages      = {5705--5709},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/ICASSP.2016.7472770},
  doi        = {10.1109/ICASSP.2016.7472770},
  timestamp  = {Fri, 03 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/HawsDSTP16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2016 paper.
% English is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
% The CoRR record DBLP:journals/corr/SaonSRK16 in this file has the same authors and title wording.
@inproceedings{DBLP:conf/interspeech/SaonSRK16,
  author     = {George Saon and Tom Sercu and Steven J. Rennie and Hong{-}Kwang Jeff Kuo},
  editor     = {Nelson Morgan},
  title      = {The {IBM} 2016 {English} Conversational Telephone Speech Recognition System},
  booktitle  = {17th Annual Conference of the International Speech Communication Association, Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages      = {7--11},
  publisher  = {{ISCA}},
  year       = {2016},
  url        = {https://doi.org/10.21437/Interspeech.2016-1460},
  doi        = {10.21437/INTERSPEECH.2016-1460},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SaonSRK16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2016 paper.
@inproceedings{DBLP:conf/interspeech/SuzukiTTRS16,
  author     = {Masayuki Suzuki and Ryuki Tachibana and Samuel Thomas and Bhuvana Ramabhadran and George Saon},
  editor     = {Nelson Morgan},
  title      = {Domain Adaptation of {CNN} Based Acoustic Models Under Limited Resource Settings},
  booktitle  = {17th Annual Conference of the International Speech Communication Association, Interspeech 2016, San Francisco, CA, USA, September 8-12, 2016},
  pages      = {1588--1592},
  publisher  = {{ISCA}},
  year       = {2016},
  url        = {https://doi.org/10.21437/Interspeech.2016-1161},
  doi        = {10.21437/INTERSPEECH.2016-1161},
  timestamp  = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/interspeech/SuzukiTTRS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1604.08242.
% English is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
% The url uses https, matching the newer arXiv records in this file.
% The Interspeech 2016 record DBLP:conf/interspeech/SaonSRK16 in this file has the same authors and title wording.
@article{DBLP:journals/corr/SaonSRK16,
  author     = {George Saon and Tom Sercu and Steven J. Rennie and Hong{-}Kwang Jeff Kuo},
  title      = {The {IBM} 2016 {English} Conversational Telephone Speech Recognition System},
  journal    = {CoRR},
  volume     = {abs/1604.08242},
  year       = {2016},
  url        = {https://arxiv.org/abs/1604.08242},
  eprinttype = {arXiv},
  eprint     = {1604.08242},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SaonSRK16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Neural Networks journal article, vol. 64.
@article{DBLP:journals/nn/SainathKSSMDR15,
  author     = {Tara N. Sainath and Brian Kingsbury and George Saon and Hagen Soltau and Abdel{-}rahman Mohamed and George E. Dahl and Bhuvana Ramabhadran},
  title      = {Deep Convolutional Neural Networks for Large-scale Speech Tasks},
  journal    = {Neural Networks},
  volume     = {64},
  pages      = {39--48},
  year       = {2015},
  url        = {https://doi.org/10.1016/j.neunet.2014.08.005},
  doi        = {10.1016/J.NEUNET.2014.08.005},
  timestamp  = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/nn/SainathKSSMDR15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2015 paper.
% The third author is written in Last, First form: in First-Last form the capitalised
% particle Van is parsed as a given name, leaving only Segbroeck as the surname for
% sorting and abbreviation.
@inproceedings{DBLP:conf/icassp/ThomasSSN15,
  author     = {Samuel Thomas and George Saon and Van Segbroeck, Maarten and Shrikanth S. Narayanan},
  title      = {Improvements to the {IBM} speech activity detection system for the {DARPA} {RATS} program},
  booktitle  = {2015 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2015, South Brisbane, Queensland, Australia, April 19-24, 2015},
  pages      = {4500--4504},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/ICASSP.2015.7178822},
  doi        = {10.1109/ICASSP.2015.7178822},
  timestamp  = {Fri, 03 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ThomasSSN15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2015 paper.
@inproceedings{DBLP:conf/icassp/KeskarS15,
  author     = {Nitish Shirish Keskar and George Saon},
  title      = {A nonmonotone learning rate strategy for {SGD} training of deep neural networks},
  booktitle  = {2015 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2015, South Brisbane, Queensland, Australia, April 19-24, 2015},
  pages      = {4974--4978},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/ICASSP.2015.7178917},
  doi        = {10.1109/ICASSP.2015.7178917},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KeskarS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2015 paper.
@inproceedings{DBLP:conf/icassp/ManguSPK15,
  author     = {Lidia Mangu and George Saon and Michael Picheny and Brian Kingsbury},
  title      = {Order-free spoken term detection},
  booktitle  = {2015 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2015, South Brisbane, Queensland, Australia, April 19-24, 2015},
  pages      = {5331--5335},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/ICASSP.2015.7178989},
  doi        = {10.1109/ICASSP.2015.7178989},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ManguSPK15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2015 paper.
% English is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
% The CoRR record DBLP:journals/corr/SaonKRP15 in this file has the same authors and title wording.
@inproceedings{DBLP:conf/interspeech/SaonKRP15,
  author     = {George Saon and Hong{-}Kwang Jeff Kuo and Steven J. Rennie and Michael Picheny},
  title      = {The {IBM} 2015 {English} conversational telephone speech recognition system},
  booktitle  = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages      = {3140--3144},
  publisher  = {{ISCA}},
  year       = {2015},
  url        = {https://doi.org/10.21437/Interspeech.2015-632},
  doi        = {10.21437/INTERSPEECH.2015-632},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SaonKRP15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2015 paper.
@inproceedings{DBLP:conf/interspeech/ThomasSKM15,
  author     = {Samuel Thomas and George Saon and Hong{-}Kwang Jeff Kuo and Lidia Mangu},
  title      = {The {IBM} {BOLT} speech transcription system},
  booktitle  = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages      = {3150--3153},
  publisher  = {{ISCA}},
  year       = {2015},
  url        = {https://doi.org/10.21437/Interspeech.2015-634},
  doi        = {10.21437/INTERSPEECH.2015-634},
  timestamp  = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/ThomasSKM15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2015 paper.
@inproceedings{DBLP:conf/interspeech/CuiSRK15,
  author     = {Jia Cui and George Saon and Bhuvana Ramabhadran and Brian Kingsbury},
  title      = {A multi-region deep neural network model in speech recognition},
  booktitle  = {16th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2015, Dresden, Germany, September 6-10, 2015},
  pages      = {3244--3248},
  publisher  = {{ISCA}},
  year       = {2015},
  url        = {https://doi.org/10.21437/Interspeech.2015-653},
  doi        = {10.21437/INTERSPEECH.2015-653},
  timestamp  = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/CuiSRK15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, CoRR abs/1505.05899.
% English is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
% The url uses https, matching the newer arXiv records in this file.
% The Interspeech 2015 record DBLP:conf/interspeech/SaonKRP15 in this file has the same authors and title wording.
@article{DBLP:journals/corr/SaonKRP15,
  author     = {George Saon and Hong{-}Kwang Jeff Kuo and Steven J. Rennie and Michael Picheny},
  title      = {The {IBM} 2015 {English} Conversational Telephone Speech Recognition System},
  journal    = {CoRR},
  volume     = {abs/1505.05899},
  year       = {2015},
  url        = {https://arxiv.org/abs/1505.05899},
  eprinttype = {arXiv},
  eprint     = {1505.05899},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SaonKRP15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ThomasGSS14,
  author     = {Samuel Thomas and Sriram Ganapathy and George Saon and Hagen Soltau},
  title      = {Analyzing convolutional neural networks for speech activity detection in mismatched acoustic conditions},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages      = {2519--2523},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/ICASSP.2014.6854054},
  doi        = {10.1109/ICASSP.2014.6854054},
  timestamp  = {Fri, 03 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ThomasGSS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonS14,
  author     = {George Saon and Hagen Soltau},
  title      = {A comparison of two optimization techniques for sequence discriminative training of deep neural networks},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages      = {5567--5571},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/ICASSP.2014.6854668},
  doi        = {10.1109/ICASSP.2014.6854668},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SaonS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SoltauSS14,
  author     = {Hagen Soltau and George Saon and Tara N. Sainath},
  title      = {Joint training of convolutional and non-convolutional neural networks},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages      = {5572--5576},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/ICASSP.2014.6854669},
  doi        = {10.1109/ICASSP.2014.6854669},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SoltauSS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SainathKMSR14,
  author     = {Tara N. Sainath and Brian Kingsbury and Abdel{-}rahman Mohamed and George Saon and Bhuvana Ramabhadran},
  title      = {Improvements to filterbank and delta learning within a deep neural network framework},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages      = {6839--6843},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/ICASSP.2014.6854925},
  doi        = {10.1109/ICASSP.2014.6854925},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SainathKMSR14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonSEP14,
  author     = {George Saon and Hagen Soltau and Ahmad Emami and Michael Picheny},
  editor     = {Haizhou Li and Helen M. Meng and Bin Ma and Engsiong Chng and Lei Xie},
  title      = {Unfolded recurrent neural networks for speech recognition},
  booktitle  = {15th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2014, Singapore, September 14-18, 2014},
  pages      = {343--347},
  publisher  = {{ISCA}},
  year       = {2014},
  url        = {https://doi.org/10.21437/Interspeech.2014-81},
  doi        = {10.21437/INTERSPEECH.2014-81},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SaonSEP14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SainathCRPGKSAC14,
  author     = {Tara N. Sainath and I{-}Hsin Chung and Bhuvana Ramabhadran and Michael Picheny and John A. Gunnels and Brian Kingsbury and George Saon and Vernon Austel and Upendra V. Chaudhari},
  editor     = {Haizhou Li and Helen M. Meng and Bin Ma and Engsiong Chng and Lei Xie},
  title      = {Parallel deep neural network training for {LVCSR} tasks using {Blue Gene/Q}},
  booktitle  = {15th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2014, Singapore, September 14-18, 2014},
  pages      = {1048--1052},
  publisher  = {{ISCA}},
  year       = {2014},
  url        = {https://doi.org/10.21437/Interspeech.2014-272},
  doi        = {10.21437/INTERSPEECH.2014-272},
  timestamp  = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SainathCRPGKSAC14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/slt/Saon14,
  author     = {George Saon},
  title      = {A distributed architecture for fast {SGD} sequence discriminative training of {DNN} acoustic models},
  booktitle  = {2014 {IEEE} Spoken Language Technology Workshop, {SLT} 2014, South Lake Tahoe, NV, USA, December 7-10, 2014},
  pages      = {183--188},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/SLT.2014.7078571},
  doi        = {10.1109/SLT.2014.7078571},
  timestamp  = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl     = {https://dblp.org/rec/conf/slt/Saon14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:series/tanlp/SoltauSMKKCB14,
  author     = {Hagen Soltau and George Saon and Lidia Mangu and Hong{-}Kwang Kuo and Brian Kingsbury and Stephen M. Chu and Fadi Biadsy},
  editor     = {Imed Zitouni},
  title      = {Automatic Speech Recognition},
  booktitle  = {Natural Language Processing of Semitic Languages},
  series     = {Theory and Applications of Natural Language Processing},
  pages      = {409--459},
  publisher  = {Springer},
  year       = {2014},
  url        = {https://doi.org/10.1007/978-3-642-45358-8\_13},
  doi        = {10.1007/978-3-642-45358-8\_13},
  timestamp  = {Wed, 06 Mar 2019 11:14:32 +0100},
  biburl     = {https://dblp.org/rec/series/tanlp/SoltauSMKKCB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/SaonSNP13,
  author     = {George Saon and Hagen Soltau and David Nahamoo and Michael Picheny},
  title      = {Speaker adaptation of neural network acoustic models using i-vectors},
  booktitle  = {2013 {IEEE} Workshop on Automatic Speech Recognition and Understanding, Olomouc, Czech Republic, December 8-12, 2013},
  pages      = {55--59},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/ASRU.2013.6707705},
  doi        = {10.1109/ASRU.2013.6707705},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/SaonSNP13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/ManguSKS13,
  author     = {Lidia Mangu and Hagen Soltau and Hong{-}Kwang Kuo and George Saon},
  title      = {The {IBM} keyword search system for the {DARPA} {RATS} program},
  booktitle  = {2013 {IEEE} Workshop on Automatic Speech Recognition and Understanding, Olomouc, Czech Republic, December 8-12, 2013},
  pages      = {204--209},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/ASRU.2013.6707730},
  doi        = {10.1109/ASRU.2013.6707730},
  timestamp  = {Fri, 26 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/ManguSKS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/SainathKMDSSBAR13,
  author     = {Tara N. Sainath and Brian Kingsbury and Abdel{-}rahman Mohamed and George E. Dahl and George Saon and Hagen Soltau and Tom{\'{a}}s Beran and Aleksandr Y. Aravkin and Bhuvana Ramabhadran},
  title      = {Improvements to Deep Convolutional Neural Networks for {LVCSR}},
  booktitle  = {2013 {IEEE} Workshop on Automatic Speech Recognition and Understanding, Olomouc, Czech Republic, December 8-12, 2013},
  pages      = {315--320},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/ASRU.2013.6707749},
  doi        = {10.1109/ASRU.2013.6707749},
  timestamp  = {Fri, 26 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/SainathKMDSSBAR13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ManguSKKS13,
  author     = {Lidia Mangu and Hagen Soltau and Hong{-}Kwang Kuo and Brian Kingsbury and George Saon},
  title      = {Exploiting diversity for spoken term detection},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages      = {8282--8286},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/ICASSP.2013.6639280},
  doi        = {10.1109/ICASSP.2013.6639280},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ManguSKKS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SoltauKMSB13,
  author     = {Hagen Soltau and Hong{-}Kwang Kuo and Lidia Mangu and George Saon and Tom{\'{a}}s Beran},
  editor     = {Fr{\'{e}}d{\'{e}}ric Bimbot and Christophe Cerisara and C{\'{e}}cile Fougeron and Guillaume Gravier and Lori Lamel and Fran{\c{c}}ois Pellegrino and Pascal Perrier},
  title      = {Neural network acoustic models for the {DARPA} {RATS} program},
  booktitle  = {14th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2013, Lyon, France, August 25-29, 2013},
  pages      = {3092--3096},
  publisher  = {{ISCA}},
  year       = {2013},
  url        = {https://doi.org/10.21437/Interspeech.2013-674},
  doi        = {10.21437/INTERSPEECH.2013-674},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SoltauKMSB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonTSGK13,
  author     = {George Saon and Samuel Thomas and Hagen Soltau and Sriram Ganapathy and Brian Kingsbury},
  editor     = {Fr{\'{e}}d{\'{e}}ric Bimbot and Christophe Cerisara and C{\'{e}}cile Fougeron and Guillaume Gravier and Lori Lamel and Fran{\c{c}}ois Pellegrino and Pascal Perrier},
  title      = {The {IBM} speech activity detection system for the {DARPA} {RATS} program},
  booktitle  = {14th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2013, Lyon, France, August 25-29, 2013},
  pages      = {3497--3501},
  publisher  = {{ISCA}},
  year       = {2013},
  url        = {https://doi.org/10.21437/Interspeech.2013-264},
  doi        = {10.21437/INTERSPEECH.2013-264},
  timestamp  = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SaonTSGK13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SainathKMDSSBAR13,
  author     = {Tara N. Sainath and Brian Kingsbury and Abdel{-}rahman Mohamed and George E. Dahl and George Saon and Hagen Soltau and Tom{\'{a}}s Beran and Aleksandr Y. Aravkin and Bhuvana Ramabhadran},
  title      = {Improvements to deep convolutional neural networks for {LVCSR}},
  journal    = {CoRR},
  volume     = {abs/1309.1501},
  year       = {2013},
  url        = {http://arxiv.org/abs/1309.1501},
  eprinttype = {arXiv},
  eprint     = {1309.1501},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SainathKMDSSBAR13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/speech/SaonS12,
  author     = {George Saon and Hagen Soltau},
  title      = {Boosting systems for large vocabulary continuous speech recognition},
  journal    = {Speech Commun.},
  volume     = {54},
  number     = {2},
  pages      = {212--218},
  year       = {2012},
  url        = {https://doi.org/10.1016/j.specom.2011.07.011},
  doi        = {10.1016/J.SPECOM.2011.07.011},
  timestamp  = {Sat, 22 Feb 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/speech/SaonS12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/spm/SaonC12,
  author     = {George Saon and Jen{-}Tzung Chien},
  title      = {Large-Vocabulary Continuous Speech Recognition Systems: {A} Look at Some Recent Advances},
  journal    = {{IEEE} Signal Process. Mag.},
  volume     = {29},
  number     = {6},
  pages      = {18--33},
  year       = {2012},
  url        = {https://doi.org/10.1109/MSP.2012.2197156},
  doi        = {10.1109/MSP.2012.2197156},
  timestamp  = {Wed, 14 Jun 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/spm/SaonC12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/SaonC12,
  author     = {George Saon and Jen{-}Tzung Chien},
  title      = {{Bayesian} Sensing Hidden {Markov} Models},
  journal    = {{IEEE} Transactions on Audio, Speech, and Language Processing},
  volume     = {20},
  number     = {1},
  pages      = {43--54},
  year       = {2012},
  url        = {https://doi.org/10.1109/TASL.2011.2129911},
  doi        = {10.1109/TASL.2011.2129911},
  timestamp  = {Sun, 17 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/taslp/SaonC12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apsipa/SaonC12,
  author     = {George Saon and Jen{-}Tzung Chien},
  title      = {Recent developments in large vocabulary continuous speech recognition},
  booktitle  = {Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, {APSIPA} 2012, Hollywood, CA, USA, December 3-6, 2012},
  pages      = {1--6},
  publisher  = {{IEEE}},
  year       = {2012},
  url        = {https://ieeexplore.ieee.org/document/6411850/},
  timestamp  = {Sun, 08 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/apsipa/SaonC12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonK12,
  author     = {George Saon and Brian Kingsbury},
  title      = {Discriminative feature-space transforms using deep neural networks},
  booktitle  = {13th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2012, Portland, Oregon, USA, September 9-13, 2012},
  pages      = {14--17},
  publisher  = {{ISCA}},
  year       = {2012},
  url        = {https://doi.org/10.21437/Interspeech.2012-4},
  doi        = {10.21437/INTERSPEECH.2012-4},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SaonK12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/CuiASG12,
  author     = {Xiaodong Cui and Mohamed Afify and George Saon and Vaibhava Goel},
  title      = {Sparse {Bayesian} Factor Analysis for Stereo-based Stochastic Mapping},
  booktitle  = {13th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2012, Portland, Oregon, USA, September 9-13, 2012},
  pages      = {795--798},
  publisher  = {{ISCA}},
  year       = {2012},
  url        = {https://doi.org/10.21437/Interspeech.2012-243},
  doi        = {10.21437/INTERSPEECH.2012-243},
  timestamp  = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/CuiASG12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ibmrd/PichenyNGKRRS11,
  author     = {Michael Picheny and David Nahamoo and Vaibhava Goel and Brian Kingsbury and Bhuvana Ramabhadran and Steven J. Rennie and George Saon},
  title      = {Trends and advances in speech recognition},
  journal    = {{IBM} J. Res. Dev.},
  volume     = {55},
  number     = {5},
  pages      = {2},
  year       = {2011},
  url        = {https://doi.org/10.1147/JRD.2011.2163277},
  doi        = {10.1147/JRD.2011.2163277},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ibmrd/PichenyNGKRRS11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/SaonC11,
  author     = {George Saon and Jen{-}Tzung Chien},
  editor     = {David Nahamoo and Michael Picheny},
  title      = {Some properties of {Bayesian} sensing hidden {Markov} models},
  booktitle  = {2011 {IEEE} Workshop on Automatic Speech Recognition {\&} Understanding, {ASRU} 2011, Waikoloa, HI, USA, December 11-15, 2011},
  pages      = {65--70},
  publisher  = {{IEEE}},
  year       = {2011},
  url        = {https://doi.org/10.1109/ASRU.2011.6163907},
  doi        = {10.1109/ASRU.2011.6163907},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/SaonC11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/KuoAMS11,
  author     = {Hong{-}Kwang Jeff Kuo and Ebru Arisoy and Lidia Mangu and George Saon},
  editor     = {David Nahamoo and Michael Picheny},
  title      = {Minimum {Bayes} risk discriminative language models for {Arabic} speech recognition},
  booktitle  = {2011 {IEEE} Workshop on Automatic Speech Recognition {\&} Understanding, {ASRU} 2011, Waikoloa, HI, USA, December 11-15, 2011},
  pages      = {208--213},
  publisher  = {{IEEE}},
  year       = {2011},
  url        = {https://doi.org/10.1109/ASRU.2011.6163932},
  doi        = {10.1109/ASRU.2011.6163932},
  timestamp  = {Fri, 26 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/KuoAMS11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/ManguKCKSSB11,
  author     = {Lidia Mangu and Hong{-}Kwang Kuo and Stephen M. Chu and Brian Kingsbury and George Saon and Hagen Soltau and Fadi Biadsy},
  editor     = {David Nahamoo and Michael Picheny},
  title      = {The {IBM} 2011 {GALE} {Arabic} speech transcription system},
  booktitle  = {2011 {IEEE} Workshop on Automatic Speech Recognition {\&} Understanding, {ASRU} 2011, Waikoloa, HI, USA, December 11-15, 2011},
  pages      = {272--277},
  publisher  = {{IEEE}},
  year       = {2011},
  url        = {https://doi.org/10.1109/ASRU.2011.6163943},
  doi        = {10.1109/ASRU.2011.6163943},
  timestamp  = {Fri, 26 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/ManguKCKSSB11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KingsburySSCKMRMJ11,
  author     = {Brian Kingsbury and Hagen Soltau and George Saon and Stephen M. Chu and Hong{-}Kwang Kuo and Lidia Mangu and Suman V. Ravuri and Nelson Morgan and Adam Janin},
  title      = {The {IBM} 2009 {GALE} {Arabic} speech transcription system},
  booktitle  = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress Center, Prague, Czech Republic},
  pages      = {4672--4675},
  publisher  = {{IEEE}},
  year       = {2011},
  url        = {https://doi.org/10.1109/ICASSP.2011.5947397},
  doi        = {10.1109/ICASSP.2011.5947397},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KingsburySSCKMRMJ11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonC11,
  author     = {George Saon and Jen{-}Tzung Chien},
  title      = {{Bayesian} sensing hidden {Markov} models for speech recognition},
  booktitle  = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress Center, Prague, Czech Republic},
  pages      = {5056--5059},
  publisher  = {{IEEE}},
  year       = {2011},
  url        = {https://doi.org/10.1109/ICASSP.2011.5947493},
  doi        = {10.1109/ICASSP.2011.5947493},
  timestamp  = {Thu, 15 Jun 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SaonC11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonC11a,
  author     = {George Saon and Jen{-}Tzung Chien},
  title      = {Discriminative training for {Bayesian} sensing hidden {Markov} models},
  booktitle  = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2011, May 22-27, 2011, Prague Congress Center, Prague, Czech Republic},
  pages      = {5316--5319},
  publisher  = {{IEEE}},
  year       = {2011},
  url        = {https://doi.org/10.1109/ICASSP.2011.5947558},
  doi        = {10.1109/ICASSP.2011.5947558},
  timestamp  = {Thu, 15 Jun 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SaonC11a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mlslp/SaonC11,
  author     = {George Saon and Jen{-}Tzung Chien},
  title      = {{Bayesian} sensing hidden {Markov} models for speech recognition},
  booktitle  = {2011 Symposium on Machine Learning in Speech and Language Processing, {MLSLP} 2011, Bellevue, WA, USA, June 27, 2011},
  publisher  = {{ISCA}},
  year       = {2011},
  url        = {https://www.isca-archive.org/mlslp\_2011/saon11\_mlslp.html},
  timestamp  = {Thu, 01 Aug 2024 15:37:24 +0200},
  biburl     = {https://dblp.org/rec/conf/mlslp/SaonC11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonSCCKKMP10,
  author     = {George Saon and Hagen Soltau and Upendra V. Chaudhari and Stephen M. Chu and Brian Kingsbury and Hong{-}Kwang Kuo and Lidia Mangu and Daniel Povey},
  title      = {The {IBM} 2008 {GALE} {Arabic} speech transcription system},
  booktitle  = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2010, 14-19 March 2010, Sheraton Dallas Hotel, Dallas, Texas, {USA}},
  pages      = {4378--4381},
  publisher  = {{IEEE}},
  year       = {2010},
  url        = {https://doi.org/10.1109/ICASSP.2010.5495640},
  doi        = {10.1109/ICASSP.2010.5495640},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SaonSCCKKMP10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonS10,
  author     = {George Saon and Hagen Soltau},
  editor     = {Takao Kobayashi and Keikichi Hirose and Satoshi Nakamura},
  title      = {Boosting systems for {LVCSR}},
  booktitle  = {11th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2010, Makuhari, Chiba, Japan, September 26-30, 2010},
  pages      = {1341--1344},
  publisher  = {{ISCA}},
  year       = {2010},
  url        = {https://doi.org/10.21437/Interspeech.2010-16},
  doi        = {10.21437/INTERSPEECH.2010-16},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SaonS10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/slt/SoltauSK10,
  author     = {Hagen Soltau and George Saon and Brian Kingsbury},
  editor     = {Dilek Hakkani{-}T{\"{u}}r and Mari Ostendorf},
  title      = {The {IBM} {Attila} speech recognition toolkit},
  booktitle  = {2010 {IEEE} Spoken Language Technology Workshop, {SLT} 2010, Berkeley, California, USA, December 12-15, 2010},
  pages      = {97--102},
  publisher  = {{IEEE}},
  year       = {2010},
  url        = {https://doi.org/10.1109/SLT.2010.5700829},
  doi        = {10.1109/SLT.2010.5700829},
  timestamp  = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl     = {https://dblp.org/rec/conf/slt/SoltauSK10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/SoltauSKKMPE09,
  author     = {Hagen Soltau and George Saon and Brian Kingsbury and Hong{-}Kwang Jeff Kuo and Lidia Mangu and Daniel Povey and Ahmad Emami},
  title      = {Advances in {Arabic} Speech Transcription at {IBM} Under the {DARPA} {GALE} Program},
  journal    = {{IEEE} Transactions on Audio, Speech, and Language Processing},
  volume     = {17},
  number     = {5},
  pages      = {884--894},
  year       = {2009},
  url        = {https://doi.org/10.1109/TASL.2009.2022966},
  doi        = {10.1109/TASL.2009.2022966},
  timestamp  = {Sun, 17 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/taslp/SoltauSKKMPE09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/SoltauS09,
  author     = {Hagen Soltau and George Saon},
  title      = {Dynamic network decoding revisited},
  booktitle  = {2009 {IEEE} Workshop on Automatic Speech Recognition {\&} Understanding, {ASRU} 2009, Merano/Meran, Italy, December 13-17, 2009},
  pages      = {276--281},
  publisher  = {{IEEE}},
  year       = {2009},
  url        = {https://doi.org/10.1109/ASRU.2009.5372904},
  doi        = {10.1109/ASRU.2009.5372904},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/SoltauS09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonPS09,
  author     = {George Saon and Daniel Povey and Hagen Soltau},
  title      = {Large margin semi-tied covariance transforms for discriminative training},
  booktitle  = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages      = {3753--3756},
  publisher  = {{IEEE}},
  year       = {2009},
  url        = {https://doi.org/10.1109/ICASSP.2009.4960443},
  doi        = {10.1109/ICASSP.2009.4960443},
  timestamp  = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/SaonPS09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyKKRSV08,
  author     = {Daniel Povey and Dimitri Kanevsky and Brian Kingsbury and Bhuvana Ramabhadran and George Saon and Karthik Visweswariah},
  title      = {Boosted {MMI} for model and feature-space discriminative training},
  booktitle  = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars Palace, Las Vegas, Nevada, {USA}},
  pages      = {4057--4060},
  publisher  = {{IEEE}},
  year       = {2008},
  url        = {https://doi.org/10.1109/ICASSP.2008.4518545},
  doi        = {10.1109/ICASSP.2008.4518545},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/PoveyKKRSV08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonP08,
  author     = {George Saon and Daniel Povey},
  title      = {Penalty function maximization for large margin {HMM} training},
  booktitle  = {9th Annual Conference of the International Speech Communication Association, {INTERSPEECH} 2008, Brisbane, Australia, September 22-26, 2008},
  pages      = {920--923},
  publisher  = {{ISCA}},
  year       = {2008},
  url        = {https://doi.org/10.21437/Interspeech.2008-108},
  doi        = {10.21437/INTERSPEECH.2008-108},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SaonP08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/SaonP07,
  author     = {George Saon and Michael Picheny},
  editor     = {Sadaoki Furui and Tatsuya Kawahara},
  title      = {Lattice-based {Viterbi} decoding techniques for speech translation},
  booktitle  = {{IEEE} Workshop on Automatic Speech Recognition {\&} Understanding, {ASRU} 2007, Kyoto, Japan, December 9-13, 2007},
  pages      = {386--389},
  publisher  = {{IEEE}},
  year       = {2007},
  url        = {https://doi.org/10.1109/ASRU.2007.4430143},
  doi        = {10.1109/ASRU.2007.4430143},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/asru/SaonP07.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SoltauSKKMPZ07,
  author     = {Hagen Soltau and George Saon and Brian Kingsbury and Hong{-}Kwang Jeff Kuo and Lidia Mangu and Daniel Povey and Geoffrey Zweig},
  title      = {The {IBM} 2006 {GALE} {Arabic} {ASR} System},
  booktitle  = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2007, Honolulu, Hawaii, USA, April 15-20, 2007},
  pages      = {349--352},
  publisher  = {{IEEE}},
  year       = {2007},
  url        = {https://doi.org/10.1109/ICASSP.2007.366921},
  doi        = {10.1109/ICASSP.2007.366921},
  timestamp  = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SoltauSKKMPZ07.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/ChenKMPSSZ06,
  author     = {Stanley F. Chen and Brian Kingsbury and Lidia Mangu and Daniel Povey and George Saon and Hagen Soltau and Geoffrey Zweig},
  title      = {Advances in speech transcription at {IBM} under the {DARPA} {EARS} program},
  journal    = {{IEEE} Transactions on Audio, Speech, and Language Processing},
  volume     = {14},
  number     = {5},
  pages      = {1596--1608},
  year       = {2006},
  url        = {https://doi.org/10.1109/TASL.2006.879814},
  doi        = {10.1109/TASL.2006.879814},
  timestamp  = {Sun, 17 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/taslp/ChenKMPSSZ06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/Saon06,
  author     = {George Saon},
  title      = {A Non-Linear Speaker Adaptation Technique using Kernel Ridge Regression},
  booktitle  = {2006 {IEEE} International Conference on Acoustics Speech and Signal Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages      = {225--228},
  publisher  = {{IEEE}},
  year       = {2006},
  url        = {https://doi.org/10.1109/ICASSP.2006.1659998},
  doi        = {10.1109/ICASSP.2006.1659998},
  timestamp  = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/Saon06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ZweigSSRPMK06,
  author     = {Geoffrey Zweig and Olivier Siohan and George Saon and Bhuvana Ramabhadran and Daniel Povey and Lidia Mangu and Brian Kingsbury},
  title      = {Automated Quality Monitoring in the Call Center with {ASR} and Maximum Entropy},
  booktitle  = {2006 {IEEE} International Conference on Acoustics Speech and Signal Processing, {ICASSP} 2006, Toulouse, France, May 14-19, 2006},
  pages      = {589--592},
  publisher  = {{IEEE}},
  year       = {2006},
  url        = {https://doi.org/10.1109/ICASSP.2006.1660089},
  doi        = {10.1109/ICASSP.2006.1660089},
  timestamp  = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ZweigSSRPMK06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PoveyS06,
  author     = {Daniel Povey and George Saon},
  title      = {Feature and model space speaker adaptation with full covariance {Gaussians}},
  booktitle  = {Ninth International Conference on Spoken Language Processing, {INTERSPEECH-ICSLP} 2006, Pittsburgh, PA, USA, September 17-21, 2006},
  publisher  = {{ISCA}},
  year       = {2006},
  url        = {https://doi.org/10.21437/Interspeech.2006-349},
  doi        = {10.21437/INTERSPEECH.2006-349},
  timestamp  = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/PoveyS06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/ZweigSSRPMK06,
  author     = {Geoffrey Zweig and Olivier Siohan and George Saon and Bhuvana Ramabhadran and Daniel Povey and Lidia Mangu and Brian Kingsbury},
  editor     = {Robert C. Moore and Jeff A. Bilmes and Jennifer Chu{-}Carroll and Mark Sanderson},
  title      = {Automated Quality Monitoring for Call Centers using Speech and {NLP} Technologies},
  booktitle  = {Human Language Technology Conference of the North American Chapter of the Association of Computational Linguistics, Proceedings, June 4-9, 2006, New York, New York, {USA}},
  publisher  = {The Association for Computational Linguistics},
  year       = {2006},
  url        = {https://aclanthology.org/N06-4011/},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/ZweigSSRPMK06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/slt/SaonRZ06,
  author     = {George Saon and Bhuvana Ramabhadran and Geoffrey Zweig},
  editor     = {Mazin Gilbert and Hermann Ney},
  title      = {On the Effect of Word Error Rate on Automated Quality Monitoring},
  booktitle  = {2006 {IEEE} {ACL} Spoken Language Technology Workshop, {SLT} 2006, Palm Beach, Aruba, December 10-13, 2006},
  pages      = {106--109},
  publisher  = {{IEEE}},
  year       = {2006},
  url        = {https://doi.org/10.1109/SLT.2006.326828},
  doi        = {10.1109/SLT.2006.326828},
  timestamp  = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl     = {https://dblp.org/rec/conf/slt/SaonRZ06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SoltauKMPSZ05,
  author     = {Hagen Soltau and Brian Kingsbury and Lidia Mangu and Daniel Povey and George Saon and Geoffrey Zweig},
  title      = {The {IBM} 2004 Conversational Telephony System for Rich Transcription},
  booktitle  = {2005 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} '05, Philadelphia, Pennsylvania, USA, March 18-23, 2005},
  pages      = {205--208},
  publisher  = {{IEEE}},
  year       = {2005},
  url        = {https://doi.org/10.1109/ICASSP.2005.1415086},
  doi        = {10.1109/ICASSP.2005.1415086},
  timestamp  = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/SoltauKMPSZ05.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/PoveyKMSSZ05,
  author     = {Daniel Povey and Brian Kingsbury and Lidia Mangu and George Saon and Hagen Soltau and Geoffrey Zweig},
  title      = {{fMPE}: Discriminatively Trained Features for Speech Recognition},
  booktitle  = {2005 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} '05, Philadelphia, Pennsylvania, USA, March 18-23, 2005},
  pages      = {961--964},
  publisher  = {{IEEE}},
  year       = {2005},
  url        = {https://doi.org/10.1109/ICASSP.2005.1415275},
  doi        = {10.1109/ICASSP.2005.1415275},
  timestamp  = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/PoveyKMSSZ05.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonPZ05,
  author    = {George Saon and Daniel Povey and Geoffrey Zweig},
  title     = {Anatomy of an extremely fast {LVCSR} decoder},
  booktitle = {9th European Conference on Speech Communication and Technology, INTERSPEECH-Eurospeech 2005, Lisbon, Portugal, September 4-8, 2005},
  pages     = {549--552},
  publisher = {{ISCA}},
  year      = {2005},
  url       = {https://doi.org/10.21437/Interspeech.2005-338},
  doi       = {10.21437/INTERSPEECH.2005-338},
  timestamp = {Tue, 11 Jun 2024 16:45:43 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SaonPZ05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/YvonZS04,
  author    = {Fran{\c{c}}ois Yvon and Geoffrey Zweig and George Saon},
  title     = {Arc minimization in finite-state decoding graphs with cross-word acoustic context},
  journal   = {Comput. Speech Lang.},
  volume    = {18},
  number    = {4},
  pages     = {397--415},
  year      = {2004},
  url       = {https://doi.org/10.1016/j.csl.2003.09.006},
  doi       = {10.1016/J.CSL.2003.09.006},
  timestamp = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/csl/YvonZS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@comment{NOTE(review): the pages value 52 in DBLP:conf/icassp/SarikayaGS04 looks truncated (neighbouring papers in this proceedings are 4-page ranges); confirm the real range on the DOI landing page before citing.}
@inproceedings{DBLP:conf/icassp/SarikayaGS04,
  author    = {Ruhi Sarikaya and Yuqing Gao and George Saon},
  title     = {Fractional {Fourier} transform features for speech recognition},
  booktitle = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages     = {52},
  publisher = {{IEEE}},
  year      = {2004},
  url       = {https://doi.org/10.1109/ICASSP.2004.1326039},
  doi       = {10.1109/ICASSP.2004.1326039},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/SarikayaGS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonDP04,
  author    = {George Saon and Satya Dharanipragada and Daniel Povey},
  title     = {Feature space {Gaussianization}},
  booktitle = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages     = {329--332},
  publisher = {{IEEE}},
  year      = {2004},
  url       = {https://doi.org/10.1109/ICASSP.2004.1325989},
  doi       = {10.1109/ICASSP.2004.1325989},
  timestamp = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/SaonDP04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/KingsburyMSZAGVP03,
  author    = {Brian Kingsbury and Lidia Mangu and George Saon and Geoffrey Zweig and Scott Axelrod and Vaibhava Goel and Karthik Visweswariah and Michael Picheny},
  title     = {Toward domain-independent conversational speech recognition},
  booktitle = {8th European Conference on Speech Communication and Technology, {EUROSPEECH} 2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages     = {1881--1884},
  publisher = {{ISCA}},
  year      = {2003},
  url       = {https://doi.org/10.21437/Eurospeech.2003-566},
  doi       = {10.21437/EUROSPEECH.2003-566},
  timestamp = {Thu, 22 Jun 2023 16:42:17 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/KingsburyMSZAGVP03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonZKMC03,
  author    = {George Saon and Geoffrey Zweig and Brian Kingsbury and Lidia Mangu and Upendra V. Chaudhari},
  title     = {An architecture for rapid decoding of large vocabulary conversational speech},
  booktitle = {8th European Conference on Speech Communication and Technology, {EUROSPEECH} 2003 - {INTERSPEECH} 2003, Geneva, Switzerland, September 1-4, 2003},
  pages     = {1977--1980},
  publisher = {{ISCA}},
  year      = {2003},
  url       = {https://doi.org/10.21437/Eurospeech.2003-571},
  doi       = {10.21437/EUROSPEECH.2003-571},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SaonZKMC03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/PadmanabhanSHKM02,
  author    = {Mukund Padmanabhan and George Saon and Jing Huang and Brian Kingsbury and Lidia Mangu},
  title     = {Automatic speech recognition performance on a voicemail transcription task},
  journal   = {{IEEE} Trans. Speech Audio Process.},
  volume    = {10},
  number    = {7},
  pages     = {433--442},
  year      = {2002},
  url       = {https://doi.org/10.1109/TSA.2002.804303},
  doi       = {10.1109/TSA.2002.804303},
  timestamp = {Sun, 17 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/taslp/PadmanabhanSHKM02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/FineSG02,
  author    = {Shai Fine and George Saon and Ramesh A. Gopinath},
  title     = {Digit recognition in noisy environments via a sequential {GMM/SVM} system},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2002, May 13-17 2002, Orlando, Florida, {USA}},
  pages     = {49--52},
  publisher = {{IEEE}},
  year      = {2002},
  url       = {https://doi.org/10.1109/ICASSP.2002.5743651},
  doi       = {10.1109/ICASSP.2002.5743651},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/FineSG02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/KingsburySMPS02,
  author    = {Brian Kingsbury and George Saon and Lidia Mangu and Mukund Padmanabhan and Ruhi Sarikaya},
  title     = {Robust speech recognition in Noisy Environments: The 2001 {IBM} {SPINE} evaluation system},
  booktitle = {Proceedings of the {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2002, May 13-17 2002, Orlando, Florida, {USA}},
  pages     = {53--56},
  publisher = {{IEEE}},
  year      = {2002},
  url       = {https://doi.org/10.1109/ICASSP.2002.5743652},
  doi       = {10.1109/ICASSP.2002.5743652},
  timestamp = {Fri, 19 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/KingsburySMPS02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ZweigSY02,
  author    = {Geoffrey Zweig and George Saon and Fran{\c{c}}ois Yvon},
  editor    = {John H. L. Hansen and Bryan L. Pellom},
  title     = {Arc minimization in finite state decoding graphs with cross-word acoustic context},
  booktitle = {7th International Conference on Spoken Language Processing, {ICSLP2002} - {INTERSPEECH} 2002, Denver, Colorado, USA, September 16-20, 2002},
  pages     = {389--392},
  publisher = {{ISCA}},
  year      = {2002},
  url       = {https://doi.org/10.21437/ICSLP.2002-162},
  doi       = {10.21437/ICSLP.2002-162},
  timestamp = {Thu, 22 Jun 2023 16:42:18 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/ZweigSY02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonH02,
  author    = {George Saon and Juan M. Huerta},
  editor    = {John H. L. Hansen and Bryan L. Pellom},
  title     = {Improvements to the {IBM} {Aurora} 2 multi-condition system},
  booktitle = {7th International Conference on Spoken Language Processing, {ICSLP2002} - {INTERSPEECH} 2002, Denver, Colorado, USA, September 16-20, 2002},
  pages     = {469--472},
  publisher = {{ISCA}},
  year      = {2002},
  url       = {https://doi.org/10.21437/ICSLP.2002-21},
  doi       = {10.21437/ICSLP.2002-21},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SaonH02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/SaonP01,
  author    = {George Saon and Mukund Padmanabhan},
  title     = {Data-driven approach to designing compound words for continuous speech recognition},
  journal   = {{IEEE} Trans. Speech Audio Process.},
  volume    = {9},
  number    = {4},
  pages     = {327--332},
  year      = {2001},
  url       = {https://doi.org/10.1109/89.917678},
  doi       = {10.1109/89.917678},
  timestamp = {Sun, 17 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/taslp/SaonP01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonZP01,
  author    = {George Saon and Geoffrey Zweig and Mukund Padmanabhan},
  title     = {Linear feature space projections for speaker adaptation},
  booktitle = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2001, 7-11 May, 2001, Salt Palace Convention Center, Salt Lake City, Utah, USA, Proceedings},
  pages     = {325--328},
  publisher = {{IEEE}},
  year      = {2001},
  url       = {https://doi.org/10.1109/ICASSP.2001.940833},
  doi       = {10.1109/ICASSP.2001.940833},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/SaonZP01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/AaronCCDEFLLMMMNOPPRSSTVY01,
  author    = {Andrew Aaron and Scott Saobing Chen and Paul S. Cohen and Satya Dharanipragada and Ellen Eide and Martin Franz and Jean{-}Michel LeRoux and X. Luo and Beno{\^{\i}}t Maison and Lidia Mangu and T. Mathes and Miroslav Novak and Peder A. Olsen and Michael Picheny and Harry Printz and Bhuvana Ramabhadran and Andrej Sakrajda and George Saon and Borivoj Tydlit{\'{a}}t and Karthik Visweswariah and D. Yuk},
  title     = {Speech recognition for {DARPA} {Communicator}},
  booktitle = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} 2001, 7-11 May, 2001, Salt Palace Convention Center, Salt Lake City, Utah, USA, Proceedings},
  pages     = {489--492},
  publisher = {{IEEE}},
  year      = {2001},
  url       = {https://doi.org/10.1109/ICASSP.2001.940874},
  doi       = {10.1109/ICASSP.2001.940874},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/AaronCCDEFLLMMMNOPPRSSTVY01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonHJ01,
  author    = {George Saon and Juan M. Huerta and Ea{-}Ee Jan},
  editor    = {Paul Dalsgaard and B{\o}rge Lindberg and Henrik Benner and Zheng{-}Hua Tan},
  title     = {Robust digit recognition in noisy environments: the {IBM} {Aurora} 2 system},
  booktitle = {{EUROSPEECH} 2001 Scandinavia, 7th European Conference on Speech Communication and Technology, 2nd {INTERSPEECH} Event, Aalborg, Denmark, September 3-7, 2001},
  pages     = {629--632},
  publisher = {{ISCA}},
  year      = {2001},
  url       = {https://doi.org/10.21437/Eurospeech.2001-166},
  doi       = {10.21437/EUROSPEECH.2001-166},
  timestamp = {Thu, 22 Jun 2023 16:42:18 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SaonHJ01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonPGC00,
  author    = {George Saon and Mukund Padmanabhan and Ramesh A. Gopinath and Scott Saobing Chen},
  title     = {Maximum likelihood discriminant feature spaces},
  booktitle = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing. {ICASSP} 2000, 5-9 June, 2000, Hilton Hotel and Convention Center, Istanbul, Turkey},
  pages     = {1129--1132},
  publisher = {{IEEE}},
  year      = {2000},
  url       = {https://doi.org/10.1109/ICASSP.2000.859163},
  doi       = {10.1109/ICASSP.2000.859163},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/SaonPGC00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SaonP00,
  author    = {George Saon and Mukund Padmanabhan},
  title     = {Minimum {Bayes} error feature selection},
  booktitle = {Sixth International Conference on Spoken Language Processing, {ICSLP} 2000 / {INTERSPEECH} 2000, Beijing, China, October 16-20, 2000},
  pages     = {75--78},
  publisher = {{ISCA}},
  year      = {2000},
  url       = {https://doi.org/10.21437/ICSLP.2000-481},
  doi       = {10.21437/ICSLP.2000-481},
  timestamp = {Thu, 22 Jun 2023 16:42:19 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/SaonP00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/HuangKMPSZ00,
  author    = {Jing Huang and Brian Kingsbury and Lidia Mangu and Mukund Padmanabhan and George Saon and Geoffrey Zweig},
  title     = {Recent improvements in speech recognition performance on large vocabulary conversational speech (voicemail and switchboard)},
  booktitle = {Sixth International Conference on Spoken Language Processing, {ICSLP} 2000 / {INTERSPEECH} 2000, Beijing, China, October 16-20, 2000},
  pages     = {338--341},
  publisher = {{ISCA}},
  year      = {2000},
  url       = {https://doi.org/10.21437/ICSLP.2000-819},
  doi       = {10.21437/ICSLP.2000-819},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HuangKMPSZ00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/JanOSR00,
  author    = {Ea{-}Ee Jan and Jaime Botella Ordinas and George Saon and Salim Roukos},
  title     = {Real-time multilingual {HMM} training robust to channel variations},
  booktitle = {Sixth International Conference on Spoken Language Processing, {ICSLP} 2000 / {INTERSPEECH} 2000, Beijing, China, October 16-20, 2000},
  pages     = {925--928},
  publisher = {{ISCA}},
  year      = {2000},
  url       = {https://doi.org/10.21437/ICSLP.2000-685},
  doi       = {10.21437/ICSLP.2000-685},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/JanOSR00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SaonP00,
  author    = {George Saon and Mukund Padmanabhan},
  editor    = {Todd K. Leen and Thomas G. Dietterich and Volker Tresp},
  title     = {Minimum {Bayes} Error Feature Selection for Continuous Speech Recognition},
  booktitle = {Advances in Neural Information Processing Systems 13, Papers from Neural Information Processing Systems {(NIPS)} 2000, Denver, CO, {USA}},
  pages     = {800--806},
  publisher = {{MIT} Press},
  year      = {2000},
  url       = {https://proceedings.neurips.cc/paper/2000/hash/59e0b2658e9f2e77f8d4d83f8d07ca84-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/SaonP00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijdar/Saon99,
  author    = {George Saon},
  title     = {Cursive word recognition using a random field based hidden {Markov} model},
  journal   = {Int. J. Document Anal. Recognit.},
  volume    = {1},
  number    = {4},
  pages     = {199--208},
  year      = {1999},
  url       = {https://doi.org/10.1007/s100320050019},
  doi       = {10.1007/S100320050019},
  timestamp = {Thu, 13 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijdar/Saon99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PadmanabhanSBHZ99,
  author    = {Mukund Padmanabhan and George Saon and Sankar Basu and Jing Huang and Geoffrey Zweig},
  title     = {Recent improvements in voicemail transcription},
  booktitle = {Sixth European Conference on Speech Communication and Technology, {EUROSPEECH} 1999, Budapest, Hungary, September 5-9, 1999},
  pages     = {503--506},
  publisher = {{ISCA}},
  year      = {1999},
  url       = {https://doi.org/10.21437/Eurospeech.1999-129},
  doi       = {10.21437/EUROSPEECH.1999-129},
  timestamp = {Wed, 18 Sep 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/PadmanabhanSBHZ99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@phdthesis{DBLP:phd/hal/Saon97,
  author    = {George Saon},
  title     = {Mod{\`{e}}les markoviens uni- et bidimensionnels pour la reconnaissance de l'{\'{e}}criture manuscrite hors-ligne. (One and two-dimensional {Markov} models for off-line handwriting recognition)},
  school    = {Henri Poincar{\'{e}} University, Nancy, France},
  year      = {1997},
  url       = {https://hal.archives-ouvertes.fr/tel-01747325},
  timestamp = {Thu, 12 May 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/phd/hal/Saon97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijprai/SaonB97,
  author    = {George Saon and Abdel Bela{\"{\i}}d},
  title     = {High Performance Unconstrained Word Recognition System Combining {HMMs} and {Markov} Random Fields},
  journal   = {Int. J. Pattern Recognit. Artif. Intell.},
  volume    = {11},
  number    = {5},
  pages     = {771--788},
  year      = {1997},
  url       = {https://doi.org/10.1142/S0218001497000342},
  doi       = {10.1142/S0218001497000342},
  timestamp = {Mon, 11 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijprai/SaonB97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SaonB97,
  author    = {George Saon and Abdel Bela{\"{\i}}d},
  title     = {Binary pattern recognition using {Markov} random fields and {HMMs}},
  booktitle = {1997 {IEEE} International Conference on Acoustics, Speech, and Signal Processing, {ICASSP} '97, Munich, Germany, April 21-24, 1997},
  pages     = {3725--3728},
  publisher = {{IEEE} Computer Society},
  year      = {1997},
  url       = {https://doi.org/10.1109/ICASSP.1997.604678},
  doi       = {10.1109/ICASSP.1997.604678},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/SaonB97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdar/SaonBG95,
  author    = {George Saon and Abdel Bela{\"{\i}}d and Yifan Gong},
  title     = {Stochastic trajectory modeling for recognition of unconstrained handwritten words},
  booktitle = {Third International Conference on Document Analysis and Recognition, {ICDAR} 1995, August 14 - 15, 1995, Montreal, Canada. Volume {I}},
  pages     = {508--511},
  publisher = {{IEEE} Computer Society},
  year      = {1995},
  url       = {https://doi.org/10.1109/ICDAR.1995.599045},
  doi       = {10.1109/ICDAR.1995.599045},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icdar/SaonBG95.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mva/SaonBG94,
  author    = {George Saon and Abdel Bela{\"{\i}}d and Yifan Gong},
  title     = {Off-line Handwriting Recognition by Statistical Correlation},
  booktitle = {Proceedings of {IAPR} Workshop on Machine Vision Applications, {MVA} 1994, December 13-15, 1994, Kawasaki, Japan},
  pages     = {371--374},
  year      = {1994},
  url       = {http://b2.cvl.iis.u-tokyo.ac.jp/mva/proceedings/CommemorativeDVD/1994/papers/1994371.pdf},
  timestamp = {Wed, 19 May 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/mva/SaonBG94.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.