BibTeX records: Michiel Bacchiani

download as .bib file

% Miipher, WASPAA 2023 proceedings record; arXiv (CoRR) counterpart: DBLP:journals/corr/abs-2303-01664.
@inproceedings{DBLP:conf/waspaa/KoizumiZKDYMZHBB23,
  author     = {Koizumi, Yuma and
                Zen, Heiga and
                Karita, Shigeki and
                Ding, Yifan and
                Yatabe, Kohei and
                Morioka, Nobuyuki and
                Zhang, Yu and
                Han, Wei and
                Bapna, Ankur and
                Bacchiani, Michiel},
  title      = {Miipher: {A} Robust Speech Restoration Model Integrating Self-Supervised
                Speech and Text Representations},
  booktitle  = {{IEEE} Workshop on Applications of Signal Processing to Audio and
                Acoustics, {WASPAA} 2023, New Paltz, NY, USA, October 22-25, 2023},
  pages      = {1--5},
  publisher  = {{IEEE}},
  year       = {2023},
  doi        = {10.1109/WASPAA58266.2023.10248089},
  url        = {https://doi.org/10.1109/WASPAA58266.2023.10248089},
  timestamp  = {Sat, 23 Sep 2023 11:31:10 +0200},
  biburl     = {https://dblp.org/rec/conf/waspaa/KoizumiZKDYMZHBB23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Miipher, arXiv (CoRR) record; proceedings counterpart: DBLP:conf/waspaa/KoizumiZKDYMZHBB23.
@article{DBLP:journals/corr/abs-2303-01664,
  author     = {Koizumi, Yuma and
                Zen, Heiga and
                Karita, Shigeki and
                Ding, Yifan and
                Yatabe, Kohei and
                Morioka, Nobuyuki and
                Zhang, Yu and
                Han, Wei and
                Bapna, Ankur and
                Bacchiani, Michiel},
  title      = {Miipher: {A} Robust Speech Restoration Model Integrating Self-Supervised
                Speech and Text Representations},
  journal    = {CoRR},
  volume     = {abs/2303.01664},
  year       = {2023},
  doi        = {10.48550/ARXIV.2303.01664},
  url        = {https://doi.org/10.48550/arXiv.2303.01664},
  eprinttype = {arXiv},
  eprint     = {2303.01664},
  timestamp  = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-01664.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% LibriTTS-R, arXiv (CoRR) record. The corpus name is braced so that
% sentence-casing bibliography styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2305-18802,
  author     = {Koizumi, Yuma and
                Zen, Heiga and
                Karita, Shigeki and
                Ding, Yifan and
                Yatabe, Kohei and
                Morioka, Nobuyuki and
                Bacchiani, Michiel and
                Zhang, Yu and
                Han, Wei and
                Bapna, Ankur},
  title      = {{LibriTTS-R}: {A} Restored Multi-Speaker Text-to-Speech Corpus},
  journal    = {CoRR},
  volume     = {abs/2305.18802},
  year       = {2023},
  doi        = {10.48550/ARXIV.2305.18802},
  url        = {https://doi.org/10.48550/arXiv.2305.18802},
  eprinttype = {arXiv},
  eprint     = {2305.18802},
  timestamp  = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-18802.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2022 proceedings record; arXiv (CoRR) counterpart: DBLP:journals/corr/abs-2202-07894.
@inproceedings{DBLP:conf/icassp/KuboKB22,
  author     = {Kubo, Yotaro and
                Karita, Shigeki and
                Bacchiani, Michiel},
  title      = {Knowledge Transfer from Large-Scale Pretrained Language Models to
                End-To-End Speech Recognizers},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages      = {8512--8516},
  publisher  = {{IEEE}},
  year       = {2022},
  doi        = {10.1109/ICASSP43922.2022.9746801},
  url        = {https://doi.org/10.1109/ICASSP43922.2022.9746801},
  timestamp  = {Tue, 07 Jun 2022 17:34:47 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KuboKB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% SpecGrad, Interspeech 2022 proceedings record; arXiv (CoRR) counterpart:
% DBLP:journals/corr/abs-2203-16749. The model name is braced so that
% sentence-casing styles do not render it as "Specgrad".
@inproceedings{DBLP:conf/interspeech/KoizumiZYCB22,
  author     = {Koizumi, Yuma and
                Zen, Heiga and
                Yatabe, Kohei and
                Chen, Nanxin and
                Bacchiani, Michiel},
  editor     = {Ko, Hanseok and
                Hansen, John H. L.},
  title      = {{SpecGrad}: Diffusion Probabilistic Model based Neural Vocoder with
                Adaptive Noise Spectral Shaping},
  booktitle  = {Interspeech 2022, 23rd Annual Conference of the International Speech
                Communication Association, Incheon, Korea, 18-22 September 2022},
  pages      = {803--807},
  publisher  = {{ISCA}},
  year       = {2022},
  doi        = {10.21437/INTERSPEECH.2022-301},
  url        = {https://doi.org/10.21437/Interspeech.2022-301},
  timestamp  = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/KoizumiZYCB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% SNRi target training, Interspeech 2022 proceedings record; arXiv (CoRR)
% counterpart: DBLP:journals/corr/abs-2111-00764. "SNRi" is braced so that
% sentence-casing styles do not render it as "Snri".
@inproceedings{DBLP:conf/interspeech/KoizumiKNPB22,
  author     = {Koizumi, Yuma and
                Karita, Shigeki and
                Narayanan, Arun and
                Panchapagesan, Sankaran and
                Bacchiani, Michiel},
  editor     = {Ko, Hanseok and
                Hansen, John H. L.},
  title      = {{SNRi} Target Training for Joint Speech Enhancement and Recognition},
  booktitle  = {Interspeech 2022, 23rd Annual Conference of the International Speech
                Communication Association, Incheon, Korea, 18-22 September 2022},
  pages      = {1173--1177},
  publisher  = {{ISCA}},
  year       = {2022},
  doi        = {10.21437/INTERSPEECH.2022-302},
  url        = {https://doi.org/10.21437/Interspeech.2022-302},
  timestamp  = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/KoizumiKNPB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% WaveFit, SLT 2022 proceedings record; arXiv (CoRR) counterpart:
% DBLP:journals/corr/abs-2210-01029. The model name is spelled "WaveFit" as in
% that record and braced against sentence-casing. The year field keeps the
% SLT 2022 edition label even though the booktitle dates the workshop to January 2023.
@inproceedings{DBLP:conf/slt/KoizumiYZB22,
  author     = {Koizumi, Yuma and
                Yatabe, Kohei and
                Zen, Heiga and
                Bacchiani, Michiel},
  title      = {{WaveFit}: An Iterative and Non-Autoregressive Neural Vocoder Based
                on Fixed-Point Iteration},
  booktitle  = {{IEEE} Spoken Language Technology Workshop, {SLT} 2022, Doha, Qatar,
                January 9-12, 2023},
  pages      = {884--891},
  publisher  = {{IEEE}},
  year       = {2022},
  doi        = {10.1109/SLT54892.2023.10022496},
  url        = {https://doi.org/10.1109/SLT54892.2023.10022496},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/slt/KoizumiYZB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record; proceedings counterpart: DBLP:conf/icassp/KuboKB22.
@article{DBLP:journals/corr/abs-2202-07894,
  author     = {Kubo, Yotaro and
                Karita, Shigeki and
                Bacchiani, Michiel},
  title      = {Knowledge Transfer from Large-scale Pretrained Language Models to
                End-to-end Speech Recognizers},
  journal    = {CoRR},
  volume     = {abs/2202.07894},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.07894},
  eprinttype = {arXiv},
  eprint     = {2202.07894},
  timestamp  = {Tue, 01 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-07894.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% SpecGrad, arXiv (CoRR) record; proceedings counterpart:
% DBLP:conf/interspeech/KoizumiZYCB22. The model name is braced so that
% sentence-casing styles do not render it as "Specgrad".
@article{DBLP:journals/corr/abs-2203-16749,
  author     = {Koizumi, Yuma and
                Zen, Heiga and
                Yatabe, Kohei and
                Chen, Nanxin and
                Bacchiani, Michiel},
  title      = {{SpecGrad}: Diffusion Probabilistic Model based Neural Vocoder with
                Adaptive Noise Spectral Shaping},
  journal    = {CoRR},
  volume     = {abs/2203.16749},
  year       = {2022},
  doi        = {10.48550/ARXIV.2203.16749},
  url        = {https://doi.org/10.48550/arXiv.2203.16749},
  eprinttype = {arXiv},
  eprint     = {2203.16749},
  timestamp  = {Tue, 05 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-16749.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% WaveFit, arXiv (CoRR) record; proceedings counterpart: DBLP:conf/slt/KoizumiYZB22.
% The model name is braced so that sentence-casing styles do not render it as "Wavefit".
@article{DBLP:journals/corr/abs-2210-01029,
  author     = {Koizumi, Yuma and
                Yatabe, Kohei and
                Zen, Heiga and
                Bacchiani, Michiel},
  title      = {{WaveFit}: An Iterative and Non-autoregressive Neural Vocoder based
                on Fixed-Point Iteration},
  journal    = {CoRR},
  volume     = {abs/2210.01029},
  year       = {2022},
  doi        = {10.48550/ARXIV.2210.01029},
  url        = {https://doi.org/10.48550/arXiv.2210.01029},
  eprinttype = {arXiv},
  eprint     = {2210.01029},
  timestamp  = {Fri, 07 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-01029.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2021 proceedings record; arXiv (CoRR) counterpart:
% DBLP:journals/corr/abs-2106-05111. "Japanese" is braced against sentence-casing.
% The Czech editor names carry their carons as BibTeX special characters
% (NOTE(review): spellings restored from the editors' usual names; confirm against the proceedings).
@inproceedings{DBLP:conf/interspeech/KaritaKBJ21,
  author     = {Karita, Shigeki and
                Kubo, Yotaro and
                Bacchiani, Michiel Adriaan Unico and
                Jones, Llion},
  editor     = {Hermansky, Hynek and
                {\v{C}}ernock{\'{y}}, Honza and
                Burget, Luk{\'{a}}{\v{s}} and
                Lamel, Lori and
                Scharenborg, Odette and
                Motl{\'{\i}}{\v{c}}ek, Petr},
  title      = {A Comparative Study on Neural Architectures and Training Methods for
                {Japanese} Speech Recognition},
  booktitle  = {Interspeech 2021, 22nd Annual Conference of the International Speech
                Communication Association, Brno, Czechia, 30 August - 3 September
                2021},
  pages      = {2092--2096},
  publisher  = {{ISCA}},
  year       = {2021},
  doi        = {10.21437/INTERSPEECH.2021-775},
  url        = {https://doi.org/10.21437/Interspeech.2021-775},
  timestamp  = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/KaritaKBJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% DF-Conformer, WASPAA 2021 proceedings record; arXiv (CoRR) counterpart:
% DBLP:journals/corr/abs-2106-15813. Model names are braced against
% sentence-casing; "Conv-TasNet" follows the spelling used in that record.
@inproceedings{DBLP:conf/waspaa/KoizumiKWEHJB21,
  author     = {Koizumi, Yuma and
                Karita, Shigeki and
                Wisdom, Scott and
                Erdogan, Hakan and
                Hershey, John R. and
                Jones, Llion and
                Bacchiani, Michiel},
  title      = {{DF-Conformer}: Integrated Architecture of {Conv-TasNet} and {Conformer}
                Using Linear Complexity Self-Attention for Speech Enhancement},
  booktitle  = {{IEEE} Workshop on Applications of Signal Processing to Audio and
                Acoustics, {WASPAA} 2021, New Paltz, NY, USA, October 17-20, 2021},
  pages      = {161--165},
  publisher  = {{IEEE}},
  year       = {2021},
  doi        = {10.1109/WASPAA52581.2021.9632794},
  url        = {https://doi.org/10.1109/WASPAA52581.2021.9632794},
  timestamp  = {Tue, 21 Dec 2021 10:11:15 +0100},
  biburl     = {https://dblp.org/rec/conf/waspaa/KoizumiKWEHJB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record; proceedings counterpart: DBLP:conf/interspeech/KaritaKBJ21.
% "Japanese" is braced so that sentence-casing styles keep the capital.
@article{DBLP:journals/corr/abs-2106-05111,
  author     = {Karita, Shigeki and
                Kubo, Yotaro and
                Bacchiani, Michiel Adriaan Unico and
                Jones, Llion},
  title      = {A Comparative Study on Neural Architectures and Training Methods for
                {Japanese} Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/2106.05111},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.05111},
  eprinttype = {arXiv},
  eprint     = {2106.05111},
  timestamp  = {Tue, 15 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-05111.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% DF-Conformer, arXiv (CoRR) record; proceedings counterpart:
% DBLP:conf/waspaa/KoizumiKWEHJB21. Title stored in Title Case like the
% proceedings record, with model names braced against sentence-casing.
@article{DBLP:journals/corr/abs-2106-15813,
  author     = {Koizumi, Yuma and
                Karita, Shigeki and
                Wisdom, Scott and
                Erdogan, Hakan and
                Hershey, John R. and
                Jones, Llion and
                Bacchiani, Michiel},
  title      = {{DF-Conformer}: Integrated Architecture of {Conv-TasNet} and {Conformer}
                Using Linear Complexity Self-Attention for Speech Enhancement},
  journal    = {CoRR},
  volume     = {abs/2106.15813},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.15813},
  eprinttype = {arXiv},
  eprint     = {2106.15813},
  timestamp  = {Mon, 05 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-15813.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% SNRi target training, arXiv (CoRR) record; proceedings counterpart:
% DBLP:conf/interspeech/KoizumiKNPB22. "SNRi" is braced so that
% sentence-casing styles do not render it as "Snri".
@article{DBLP:journals/corr/abs-2111-00764,
  author     = {Koizumi, Yuma and
                Karita, Shigeki and
                Narayanan, Arun and
                Panchapagesan, Sankaran and
                Bacchiani, Michiel},
  title      = {{SNRi} Target Training for Joint Speech Enhancement and Recognition},
  journal    = {CoRR},
  volume     = {abs/2111.00764},
  year       = {2021},
  url        = {https://arxiv.org/abs/2111.00764},
  eprinttype = {arXiv},
  eprint     = {2111.00764},
  timestamp  = {Fri, 05 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-00764.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2020 proceedings record.
@inproceedings{DBLP:conf/icassp/KuboB20,
  author     = {Kubo, Yotaro and
                Bacchiani, Michiel},
  title      = {Joint Phoneme-Grapheme Model for End-To-End Speech Recognition},
  booktitle  = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages      = {6119--6123},
  publisher  = {{IEEE}},
  year       = {2020},
  doi        = {10.1109/ICASSP40776.2020.9054557},
  url        = {https://doi.org/10.1109/ICASSP40776.2020.9054557},
  timestamp  = {Thu, 23 Jul 2020 16:19:28 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KuboB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Guest-editorial introduction in IEEE J. Sel. Top. Signal Process., vol. 13, no. 4.
@article{DBLP:journals/jstsp/WatanabeABHS19,
  author     = {Watanabe, Shinji and
                Araki, Shoko and
                Bacchiani, Michiel and
                Haeb{-}Umbach, Reinhold and
                Seltzer, Michael L.},
  title      = {Introduction to the Issue on Far-Field Speech Processing in the Era
                of Deep Learning: Speech Enhancement, Separation, and Recognition},
  journal    = {{IEEE} J. Sel. Top. Signal Process.},
  volume     = {13},
  number     = {4},
  pages      = {785--786},
  year       = {2019},
  doi        = {10.1109/JSTSP.2019.2925640},
  url        = {https://doi.org/10.1109/JSTSP.2019.2925640},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jstsp/WatanabeABHS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% IEEE Signal Process. Mag. article. The subtitle is stored in Title Case like the
% other titles in this file; the bibliography style decides the final casing.
@article{DBLP:journals/spm/Haeb-UmbachWNBH19,
  author     = {Haeb{-}Umbach, Reinhold and
                Watanabe, Shinji and
                Nakatani, Tomohiro and
                Bacchiani, Michiel and
                Hoffmeister, Bj{\"{o}}rn and
                Seltzer, Michael L. and
                Zen, Heiga and
                Souden, Mehrez},
  title      = {Speech Processing for Digital Home Assistants: Combining Signal Processing
                with Deep-Learning Techniques},
  journal    = {{IEEE} Signal Process. Mag.},
  volume     = {36},
  number     = {6},
  pages      = {111--124},
  year       = {2019},
  doi        = {10.1109/MSP.2019.2918706},
  url        = {https://doi.org/10.1109/MSP.2019.2918706},
  timestamp  = {Fri, 26 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/spm/Haeb-UmbachWNBH19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Lingvo framework paper, arXiv (CoRR) record. The framework name is braced against
% sentence-casing, the word after the colon follows the file's {A} convention, and
% the arXiv URL uses https like the other arXiv records in this file.
@article{DBLP:journals/corr/abs-1902-08295,
  author     = {Shen, Jonathan and
                Nguyen, Patrick and
                Wu, Yonghui and
                Chen, Zhifeng and
                Chen, Mia Xu and
                Jia, Ye and
                Kannan, Anjuli and
                Sainath, Tara N. and
                Cao, Yuan and
                Chiu, Chung{-}Cheng and
                He, Yanzhang and
                Chorowski, Jan and
                Hinsu, Smit and
                Laurenzo, Stella and
                Qin, James and
                Firat, Orhan and
                Macherey, Wolfgang and
                Gupta, Suyog and
                Bapna, Ankur and
                Zhang, Shuyuan and
                Pang, Ruoming and
                Weiss, Ron J. and
                Prabhavalkar, Rohit and
                Liang, Qiao and
                Jacob, Benoit and
                Liang, Bowen and
                Lee, HyoukJoong and
                Chelba, Ciprian and
                Jean, S{\'{e}}bastien and
                Li, Bo and
                Johnson, Melvin and
                Anil, Rohan and
                Tibrewal, Rajat and
                Liu, Xiaobing and
                Eriguchi, Akiko and
                Jaitly, Navdeep and
                Ari, Naveen and
                Cherry, Colin and
                Haghani, Parisa and
                Good, Otavio and
                Cheng, Youlong and
                Alvarez, Raziel and
                Caswell, Isaac and
                Hsu, Wei{-}Ning and
                Yang, Zongheng and
                Wang, Kuan{-}Chieh and
                Gonina, Ekaterina and
                Tomanek, Katrin and
                Vanik, Ben and
                Wu, Zelin and
                Jones, Llion and
                Schuster, Mike and
                Huang, Yanping and
                Chen, Dehao and
                Irie, Kazuki and
                Foster, George F. and
                Richardson, John and
                Macherey, Klaus and
                Bruguier, Antoine and
                Zen, Heiga and
                Raffel, Colin and
                Kumar, Shankar and
                Rao, Kanishka and
                Rybach, David and
                Murray, Matthew and
                Peddinti, Vijayaditya and
                Krikun, Maxim and
                Bacchiani, Michiel and
                Jablin, Thomas B. and
                Suderman, Robert and
                Williams, Ian and
                Lee, Benjamin and
                Bhatia, Deepti and
                Carlson, Justin and
                Yavuz, Semih and
                Zhang, Yu and
                McGraw, Ian and
                Galkin, Max and
                Ge, Qi and
                Pundak, Golan and
                Whipkey, Chad and
                Wang, Todd and
                Alon, Uri and
                Lepikhin, Dmitry and
                Tian, Ye and
                Sabour, Sara and
                Chan, William and
                Toshniwal, Shubham and
                Liao, Baohua and
                Nirschl, Michael and
                Rondon, Pat},
  title      = {{Lingvo}: {A} Modular and Scalable Framework for Sequence-to-Sequence
                Modeling},
  journal    = {CoRR},
  volume     = {abs/1902.08295},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.08295},
  eprinttype = {arXiv},
  eprint     = {1902.08295},
  timestamp  = {Tue, 07 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-08295.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% IEEE Signal Process. Mag. column, vol. 35, no. 6.
@article{DBLP:journals/spm/BacchianiF18,
  author     = {Bacchiani, Michiel and
                Fosler{-}Lussier, Eric},
  title      = {An Overview of the {IEEE} {SPS} Speech and Language Technical Committee
                [In the Spotlight]},
  journal    = {{IEEE} Signal Process. Mag.},
  volume     = {35},
  number     = {6},
  pages      = {125--126},
  year       = {2018},
  doi        = {10.1109/MSP.2018.2863099},
  url        = {https://doi.org/10.1109/MSP.2018.2863099},
  timestamp  = {Sat, 01 Dec 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/spm/BacchianiF18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2018 proceedings record. The eighth author is spelled "Yonghui Wu" to agree
% with the other records in this file that share these co-authors
% (e.g. DBLP:conf/icassp/ChiuSWPNCKWRGJL18); the source record had "Yanghui".
@inproceedings{DBLP:conf/icassp/LiSSBWNCWR18,
  author     = {Li, Bo and
                Sainath, Tara N. and
                Sim, Khe Chai and
                Bacchiani, Michiel and
                Weinstein, Eugene and
                Nguyen, Patrick and
                Chen, Zhifeng and
                Wu, Yonghui and
                Rao, Kanishka},
  title      = {Multi-Dialect Speech Recognition with a Single Sequence-to-Sequence
                Model},
  booktitle  = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages      = {4749--4753},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.1109/ICASSP.2018.8461886},
  url        = {https://doi.org/10.1109/ICASSP.2018.8461886},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/LiSSBWNCWR18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2018 proceedings record.
@inproceedings{DBLP:conf/icassp/ChiuSWPNCKWRGJL18,
  author     = {Chiu, Chung{-}Cheng and
                Sainath, Tara N. and
                Wu, Yonghui and
                Prabhavalkar, Rohit and
                Nguyen, Patrick and
                Chen, Zhifeng and
                Kannan, Anjuli and
                Weiss, Ron J. and
                Rao, Kanishka and
                Gonina, Ekaterina and
                Jaitly, Navdeep and
                Li, Bo and
                Chorowski, Jan and
                Bacchiani, Michiel},
  title      = {State-of-the-Art Speech Recognition with Sequence-to-Sequence Models},
  booktitle  = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages      = {4774--4778},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.1109/ICASSP.2018.8462105},
  url        = {https://doi.org/10.1109/ICASSP.2018.8462105},
  timestamp  = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ChiuSWPNCKWRGJL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2018 proceedings record.
@inproceedings{DBLP:conf/icassp/VarianiBLMB18,
  author     = {Variani, Ehsan and
                Bagby, Tom and
                Lahouel, Kamel and
                McDermott, Erik and
                Bacchiani, Michiel},
  title      = {Sampled Connectionist Temporal Classification},
  booktitle  = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages      = {4959--4963},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.1109/ICASSP.2018.8461929},
  url        = {https://doi.org/10.1109/ICASSP.2018.8461929},
  timestamp  = {Tue, 18 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/VarianiBLMB18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2018 proceedings record. The source record repeated the final title word
% ("... Mask Selection Selection"); the duplicate is removed here.
@inproceedings{DBLP:conf/icassp/KimMBS18,
  author     = {Kim, Chanwoo and
                Menon, Anjali and
                Bacchiani, Michiel and
                Stern, Richard M.},
  title      = {Sound Source Separation Using Phase Difference and Reliable Mask
                Selection},
  booktitle  = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages      = {5559--5563},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.1109/ICASSP.2018.8462269},
  url        = {https://doi.org/10.1109/ICASSP.2018.8462269},
  timestamp  = {Mon, 24 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KimMBS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2018 proceedings record.
@inproceedings{DBLP:conf/icassp/KimSNMNB18,
  author     = {Kim, Chanwoo and
                Sainath, Tara N. and
                Narayanan, Arun and
                Misra, Ananya and
                Nongpiur, Rajeev C. and
                Bacchiani, Michiel},
  title      = {Spectral Distortion Model for Training Phase-Sensitive Deep-Neural
                Networks for Far-Field Speech Recognition},
  booktitle  = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages      = {5729--5733},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.1109/ICASSP.2018.8462223},
  url        = {https://doi.org/10.1109/ICASSP.2018.8462223},
  timestamp  = {Mon, 24 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KimSNMNB18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICASSP 2018 proceedings record.
@inproceedings{DBLP:conf/icassp/HeymannBS18,
  author     = {Heymann, Jahn and
                Bacchiani, Michiel and
                Sainath, Tara N.},
  title      = {Performance of Mask Based Statistical Beamforming in a Smart Home
                Scenario},
  booktitle  = {2018 {IEEE} International Conference on Acoustics, Speech and Signal
                Processing, {ICASSP} 2018, Calgary, AB, Canada, April 15-20, 2018},
  pages      = {6722--6726},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.1109/ICASSP.2018.8462372},
  url        = {https://doi.org/10.1109/ICASSP.2018.8462372},
  timestamp  = {Tue, 18 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/HeymannBS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2018 proceedings record.
@inproceedings{DBLP:conf/interspeech/SimNMTPSHLB18,
  author     = {Sim, Khe Chai and
                Narayanan, Arun and
                Misra, Ananya and
                Tripathi, Anshuman and
                Pundak, Golan and
                Sainath, Tara N. and
                Haghani, Parisa and
                Li, Bo and
                Bacchiani, Michiel},
  editor     = {Yegnanarayana, B.},
  title      = {Domain Adaptation Using Factorized Hidden Layer for Robust Automatic
                Speech Recognition},
  booktitle  = {Interspeech 2018, 19th Annual Conference of the International Speech
                Communication Association, Hyderabad, India, 2-6 September 2018},
  pages      = {892--896},
  publisher  = {{ISCA}},
  year       = {2018},
  doi        = {10.21437/INTERSPEECH.2018-2246},
  url        = {https://doi.org/10.21437/Interspeech.2018-2246},
  timestamp  = {Fri, 21 May 2021 08:16:43 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/SimNMTPSHLB18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Interspeech 2018 proceedings record.
@inproceedings{DBLP:conf/interspeech/KimVNB18,
  author     = {Kim, Chanwoo and
                Variani, Ehsan and
                Narayanan, Arun and
                Bacchiani, Michiel},
  editor     = {Yegnanarayana, B.},
  title      = {Efficient Implementation of the Room Simulator for Training Deep Neural
                Network Acoustic Models},
  booktitle  = {Interspeech 2018, 19th Annual Conference of the International Speech
                Communication Association, Hyderabad, India, 2-6 September 2018},
  pages      = {3028--3032},
  publisher  = {{ISCA}},
  year       = {2018},
  doi        = {10.21437/INTERSPEECH.2018-2566},
  url        = {https://doi.org/10.21437/Interspeech.2018-2566},
  timestamp  = {Mon, 24 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/KimVNB18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% SLT 2018 proceedings record; arXiv (CoRR) counterpart: DBLP:journals/corr/abs-1808-05312.
@inproceedings{DBLP:conf/slt/NarayananMSPTEH18,
  author     = {Narayanan, Arun and
                Misra, Ananya and
                Sim, Khe Chai and
                Pundak, Golan and
                Tripathi, Anshuman and
                Elfeky, Mohamed and
                Haghani, Parisa and
                Strohman, Trevor and
                Bacchiani, Michiel},
  title      = {Toward Domain-Invariant Speech Recognition via Large Scale Training},
  booktitle  = {2018 {IEEE} Spoken Language Technology Workshop, {SLT} 2018, Athens,
                Greece, December 18-21, 2018},
  pages      = {441--447},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.1109/SLT.2018.8639610},
  url        = {https://doi.org/10.1109/SLT.2018.8639610},
  timestamp  = {Tue, 30 Mar 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/slt/NarayananMSPTEH18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% SLT 2018 proceedings record; arXiv (CoRR) counterpart: DBLP:journals/corr/abs-1809-09190.
@inproceedings{DBLP:conf/slt/HaghaniNBCGMPQW18,
  author     = {Haghani, Parisa and
                Narayanan, Arun and
                Bacchiani, Michiel and
                Chuang, Galen and
                Gaur, Neeraj and
                Moreno, Pedro J. and
                Prabhavalkar, Rohit and
                Qu, Zhongdi and
                Waters, Austin},
  title      = {From Audio to Semantics: Approaches to End-to-End Spoken Language
                Understanding},
  booktitle  = {2018 {IEEE} Spoken Language Technology Workshop, {SLT} 2018, Athens,
                Greece, December 18-21, 2018},
  pages      = {720--726},
  publisher  = {{IEEE}},
  year       = {2018},
  doi        = {10.1109/SLT.2018.8639043},
  url        = {https://doi.org/10.1109/SLT.2018.8639043},
  timestamp  = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/slt/HaghaniNBCGMPQW18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record; proceedings counterpart: DBLP:conf/slt/NarayananMSPTEH18.
% Title stored in Title Case like the proceedings record; the arXiv URL uses https
% like the other arXiv records in this file.
@article{DBLP:journals/corr/abs-1808-05312,
  author     = {Narayanan, Arun and
                Misra, Ananya and
                Sim, Khe Chai and
                Pundak, Golan and
                Tripathi, Anshuman and
                Elfeky, Mohamed and
                Haghani, Parisa and
                Strohman, Trevor and
                Bacchiani, Michiel},
  title      = {Toward Domain-Invariant Speech Recognition via Large Scale Training},
  journal    = {CoRR},
  volume     = {abs/1808.05312},
  year       = {2018},
  url        = {https://arxiv.org/abs/1808.05312},
  eprinttype = {arXiv},
  eprint     = {1808.05312},
  timestamp  = {Tue, 30 Mar 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-05312.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record; proceedings counterpart: DBLP:conf/slt/HaghaniNBCGMPQW18.
% Subtitle stored in Title Case like the proceedings record; the arXiv URL uses
% https like the other arXiv records in this file.
@article{DBLP:journals/corr/abs-1809-09190,
  author     = {Haghani, Parisa and
                Narayanan, Arun and
                Bacchiani, Michiel and
                Chuang, Galen and
                Gaur, Neeraj and
                Moreno, Pedro J. and
                Prabhavalkar, Rohit and
                Qu, Zhongdi and
                Waters, Austin},
  title      = {From Audio to Semantics: Approaches to End-to-End Spoken Language
                Understanding},
  journal    = {CoRR},
  volume     = {abs/1809.09190},
  year       = {2018},
  url        = {https://arxiv.org/abs/1809.09190},
  eprinttype = {arXiv},
  eprint     = {1809.09190},
  timestamp  = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-09190.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/taslp/SainathWWLNVBSS17,
  author       = {Sainath, Tara N. and
                  Weiss, Ron J. and
                  Wilson, Kevin W. and
                  Li, Bo and
                  Narayanan, Arun and
                  Variani, Ehsan and
                  Bacchiani, Michiel and
                  Shafran, Izhak and
                  Senior, Andrew W. and
                  Chin, Kean K. and
                  Misra, Ananya and
                  Kim, Chanwoo},
  title        = {Multichannel Signal Processing With Deep Neural Networks for Automatic
                  Speech Recognition},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {25},
  number       = {5},
  pages        = {965--979},
  year         = {2017},
  url          = {https://doi.org/10.1109/TASLP.2017.2672401},
  doi          = {10.1109/TASLP.2017.2672401},
  timestamp    = {Mon, 24 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/SainathWWLNVBSS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/SimNBSB17,
  author       = {Sim, Khe Chai and
                  Narayanan, Arun and
                  Bagby, Tom and
                  Sainath, Tara N. and
                  Bacchiani, Michiel},
  title        = {Improving the efficiency of forward-backward algorithm using batched
                  computation in {TensorFlow}},
  booktitle    = {2017 {IEEE} Automatic Speech Recognition and Understanding Workshop,
                  {ASRU} 2017, Okinawa, Japan, December 16-20, 2017},
  pages        = {258--264},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ASRU.2017.8268944},
  doi          = {10.1109/ASRU.2017.8268944},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/asru/SimNBSB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/KimMCHNSB17,
  author       = {Kim, Chanwoo and
                  Misra, Ananya and
                  Chin, Kean K. and
                  Hughes, Thad and
                  Narayanan, Arun and
                  Sainath, Tara N. and
                  Bacchiani, Michiel},
  editor       = {Lacerda, Francisco},
  title        = {Generation of Large-Scale Simulated Utterances in Virtual Rooms to
                  Train Deep-Neural Networks for Far-Field Speech Recognition in {Google}
                  {Home}},
  booktitle    = {Interspeech 2017, 18th Annual Conference of the International Speech
                  Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages        = {379--383},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-1510},
  doi          = {10.21437/INTERSPEECH.2017-1510},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/KimMCHNSB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LiSNCBMSSPCSWWV17,
  author       = {Li, Bo and
                  Sainath, Tara N. and
                  Narayanan, Arun and
                  Caroselli, Joe and
                  Bacchiani, Michiel and
                  Misra, Ananya and
                  Shafran, Izhak and
                  Sak, Hasim and
                  Pundak, Golan and
                  Chin, Kean K. and
                  Sim, Khe Chai and
                  Weiss, Ron J. and
                  Wilson, Kevin W. and
                  Variani, Ehsan and
                  Kim, Chanwoo and
                  Siohan, Olivier and
                  Weintraub, Mitchel and
                  McDermott, Erik and
                  Rose, Richard and
                  Shannon, Matt},
  editor       = {Lacerda, Francisco},
  title        = {Acoustic Modeling for {Google} {Home}},
  booktitle    = {Interspeech 2017, 18th Annual Conference of the International Speech
                  Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages        = {399--403},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-234},
  doi          = {10.21437/INTERSPEECH.2017-234},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/LiSNCBMSSPCSWWV17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/VarianiBMB17,
  author       = {Variani, Ehsan and
                  Bagby, Tom and
                  McDermott, Erik and
                  Bacchiani, Michiel},
  editor       = {Lacerda, Francisco},
  title        = {End-to-End Training of Acoustic Models for Large Vocabulary Continuous
                  Speech Recognition with {TensorFlow}},
  booktitle    = {Interspeech 2017, 18th Annual Conference of the International Speech
                  Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages        = {1641--1645},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-1284},
  doi          = {10.21437/INTERSPEECH.2017-1284},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/VarianiBMB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:books/sp/17/SainathWWNBLVSSCMK17,
  author       = {Sainath, Tara N. and
                  Weiss, Ron J. and
                  Wilson, Kevin W. and
                  Narayanan, Arun and
                  Bacchiani, Michiel and
                  Li, Bo and
                  Variani, Ehsan and
                  Shafran, Izhak and
                  Senior, Andrew W. and
                  Chin, Kean K. and
                  Misra, Ananya and
                  Kim, Chanwoo},
  editor       = {Watanabe, Shinji and
                  Delcroix, Marc and
                  Metze, Florian and
                  Hershey, John R.},
  title        = {Raw Multichannel Processing Using Deep Neural Networks},
  booktitle    = {New Era for Robust Speech Recognition, Exploiting Deep Learning},
  pages        = {105--133},
  publisher    = {Springer},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-3-319-64680-0\_5},
  doi          = {10.1007/978-3-319-64680-0\_5},
  timestamp    = {Mon, 24 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/sp/17/SainathWWNBLVSSCMK17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:books/sp/17/BacchianiBGMSSZ17,
  author       = {Bacchiani, Michiel and
                  Beaufays, Fran{\c{c}}oise and
                  Gruenstein, Alexander and
                  Moreno, Pedro J. and
                  Schalkwyk, Johan and
                  Strohman, Trevor and
                  Zen, Heiga},
  editor       = {Watanabe, Shinji and
                  Delcroix, Marc and
                  Metze, Florian and
                  Hershey, John R.},
  title        = {Speech Research at {Google} to Enable Universal Speech Interfaces},
  booktitle    = {New Era for Robust Speech Recognition, Exploiting Deep Learning},
  pages        = {385--399},
  publisher    = {Springer},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-3-319-64680-0\_18},
  doi          = {10.1007/978-3-319-64680-0\_18},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/sp/17/BacchianiBGMSSZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1712-01541,
  author       = {Li, Bo and
                  Sainath, Tara N. and
                  Sim, Khe Chai and
                  Bacchiani, Michiel and
                  Weinstein, Eugene and
                  Nguyen, Patrick and
                  Chen, Zhifeng and
                  Wu, Yonghui and
                  Rao, Kanishka},
  title        = {Multi-Dialect Speech Recognition With A Single Sequence-To-Sequence
                  Model},
  journal      = {CoRR},
  volume       = {abs/1712.01541},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.01541},
  eprinttype   = {arXiv},
  eprint       = {1712.01541},
  timestamp    = {Wed, 28 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-01541.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1712-01769,
  author       = {Chiu, Chung{-}Cheng and
                  Sainath, Tara N. and
                  Wu, Yonghui and
                  Prabhavalkar, Rohit and
                  Nguyen, Patrick and
                  Chen, Zhifeng and
                  Kannan, Anjuli and
                  Weiss, Ron J. and
                  Rao, Kanishka and
                  Gonina, Katya and
                  Jaitly, Navdeep and
                  Li, Bo and
                  Chorowski, Jan and
                  Bacchiani, Michiel},
  title        = {State-of-the-art Speech Recognition With Sequence-to-Sequence Models},
  journal      = {CoRR},
  volume       = {abs/1712.01769},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.01769},
  eprinttype   = {arXiv},
  eprint       = {1712.01769},
  timestamp    = {Wed, 28 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-01769.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1712-03439,
  author       = {Kim, Chanwoo and
                  Variani, Ehsan and
                  Narayanan, Arun and
                  Bacchiani, Michiel},
  title        = {Efficient Implementation of the Room Simulator for Training Deep Neural
                  Network Acoustic Models},
  journal      = {CoRR},
  volume       = {abs/1712.03439},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.03439},
  eprinttype   = {arXiv},
  eprint       = {1712.03439},
  timestamp    = {Mon, 24 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-03439.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SainathWWNB16,
  author       = {Sainath, Tara N. and
                  Weiss, Ron J. and
                  Wilson, Kevin W. and
                  Narayanan, Arun and
                  Bacchiani, Michiel},
  title        = {Factored spatial and spectral multichannel raw waveform {CLDNNs}},
  booktitle    = {2016 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages        = {5075--5079},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/ICASSP.2016.7472644},
  doi          = {10.1109/ICASSP.2016.7472644},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SainathWWNB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/VarianiSSB16,
  author       = {Variani, Ehsan and
                  Sainath, Tara N. and
                  Shafran, Izhak and
                  Bacchiani, Michiel},
  editor       = {Morgan, Nelson},
  title        = {Complex Linear Projection {(CLP):} {A} Discriminative Approach to
                  Joint Feature Extraction and Acoustic Modeling},
  booktitle    = {Interspeech 2016, 17th Annual Conference of the International Speech
                  Communication Association, San Francisco, CA, USA, September 8-12,
                  2016},
  pages        = {808--812},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {https://doi.org/10.21437/Interspeech.2016-1459},
  doi          = {10.21437/INTERSPEECH.2016-1459},
  timestamp    = {Mon, 26 Jun 2023 16:43:56 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/VarianiSSB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SainathNWVWBS16,
  author       = {Sainath, Tara N. and
                  Narayanan, Arun and
                  Weiss, Ron J. and
                  Variani, Ehsan and
                  Wilson, Kevin W. and
                  Bacchiani, Michiel and
                  Shafran, Izhak},
  editor       = {Morgan, Nelson},
  title        = {Reducing the Computational Complexity of Multimicrophone Acoustic
                  Models with Integrated Feature Extraction},
  booktitle    = {Interspeech 2016, 17th Annual Conference of the International Speech
                  Communication Association, San Francisco, CA, USA, September 8-12,
                  2016},
  pages        = {1971--1975},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {https://doi.org/10.21437/Interspeech.2016-92},
  doi          = {10.21437/INTERSPEECH.2016-92},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/SainathNWVWBS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LiSWWB16,
  author       = {Li, Bo and
                  Sainath, Tara N. and
                  Weiss, Ron J. and
                  Wilson, Kevin W. and
                  Bacchiani, Michiel},
  editor       = {Morgan, Nelson},
  title        = {Neural Network Adaptive Beamforming for Robust Multichannel Speech
                  Recognition},
  booktitle    = {Interspeech 2016, 17th Annual Conference of the International Speech
                  Communication Association, San Francisco, CA, USA, September 8-12,
                  2016},
  pages        = {1976--1980},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {https://doi.org/10.21437/Interspeech.2016-173},
  doi          = {10.21437/INTERSPEECH.2016-173},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/LiSWWB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asru/SainathWWNBS15,
  author       = {Sainath, Tara N. and
                  Weiss, Ron J. and
                  Wilson, Kevin W. and
                  Narayanan, Arun and
                  Bacchiani, Michiel and
                  Senior, Andrew W.},
  title        = {Speaker location and microphone spacing invariant acoustic modeling
                  from raw multichannel waveforms},
  booktitle    = {2015 {IEEE} Workshop on Automatic Speech Recognition and Understanding,
                  {ASRU} 2015, Scottsdale, AZ, USA, December 13-17, 2015},
  pages        = {30--36},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/ASRU.2015.7404770},
  doi          = {10.1109/ASRU.2015.7404770},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/asru/SainathWWNBS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LiaoPSCCJSSBB15,
  author       = {Liao, Hank and
                  Pundak, Golan and
                  Siohan, Olivier and
                  Carroll, Melissa K. and
                  Coccaro, Noah and
                  Jiang, Qi{-}Ming and
                  Sainath, Tara N. and
                  Senior, Andrew W. and
                  Beaufays, Fran{\c{c}}oise and
                  Bacchiani, Michiel},
  title        = {Large vocabulary automatic speech recognition for children},
  booktitle    = {{INTERSPEECH} 2015, 16th Annual Conference of the International Speech
                  Communication Association, Dresden, Germany, September 6-10, 2015},
  pages        = {1611--1615},
  publisher    = {{ISCA}},
  year         = {2015},
  url          = {https://doi.org/10.21437/Interspeech.2015-373},
  doi          = {10.21437/INTERSPEECH.2015-373},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/LiaoPSCCJSSBB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BacchianiR14,
  author       = {Bacchiani, Michiel and
                  Rybach, David},
  title        = {Context dependent state tying for speech recognition using deep neural
                  network acoustic models},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages        = {230--234},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICASSP.2014.6853592},
  doi          = {10.1109/ICASSP.2014.6853592},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BacchianiR14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/HeigoldMVSB14,
  author       = {Heigold, Georg and
                  McDermott, Erik and
                  Vanhoucke, Vincent and
                  Senior, Andrew W. and
                  Bacchiani, Michiel},
  title        = {Asynchronous stochastic optimization for sequence training of deep
                  neural networks},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages        = {5587--5591},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICASSP.2014.6854672},
  doi          = {10.1109/ICASSP.2014.6854672},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/HeigoldMVSB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SeniorHBL14,
  author       = {Senior, Andrew W. and
                  Heigold, Georg and
                  Bacchiani, Michiel and
                  Liao, Hank},
  title        = {{GMM}-free {DNN} acoustic model training},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2014, Florence, Italy, May 4-9, 2014},
  pages        = {5602--5606},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICASSP.2014.6854675},
  doi          = {10.1109/ICASSP.2014.6854675},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/SeniorHBL14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/McDermottHMSB14,
  author       = {McDermott, Erik and
                  Heigold, Georg and
                  Moreno, Pedro J. and
                  Senior, Andrew W. and
                  Bacchiani, Michiel},
  editor       = {Li, Haizhou and
                  Meng, Helen M. and
                  Ma, Bin and
                  Chng, Engsiong and
                  Xie, Lei},
  title        = {Asynchronous stochastic optimization for sequence training of deep
                  neural networks: towards big data},
  booktitle    = {{INTERSPEECH} 2014, 15th Annual Conference of the International Speech
                  Communication Association, Singapore, September 14-18, 2014},
  pages        = {1224--1228},
  publisher    = {{ISCA}},
  year         = {2014},
  url          = {https://doi.org/10.21437/Interspeech.2014-308},
  doi          = {10.21437/INTERSPEECH.2014-308},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/McDermottHMSB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/BacchianiSH14,
  author       = {Bacchiani, Michiel and
                  Senior, Andrew W. and
                  Heigold, Georg},
  editor       = {Li, Haizhou and
                  Meng, Helen M. and
                  Ma, Bin and
                  Chng, Engsiong and
                  Xie, Lei},
  title        = {Asynchronous, online, {GMM}-free training of a context dependent acoustic
                  model for speech recognition},
  booktitle    = {{INTERSPEECH} 2014, 15th Annual Conference of the International Speech
                  Communication Association, Singapore, September 14-18, 2014},
  pages        = {1900--1904},
  publisher    = {{ISCA}},
  year         = {2014},
  url          = {https://doi.org/10.21437/Interspeech.2014-430},
  doi          = {10.21437/INTERSPEECH.2014-430},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/BacchianiSH14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/KimCBS14,
  author       = {Kim, Chanwoo and
                  Chin, Kean K. and
                  Bacchiani, Michiel and
                  Stern, Richard M.},
  editor       = {Li, Haizhou and
                  Meng, Helen M. and
                  Ma, Bin and
                  Chng, Engsiong and
                  Xie, Lei},
  title        = {Robust speech recognition using temporal masking and thresholding
                  algorithm},
  booktitle    = {{INTERSPEECH} 2014, 15th Annual Conference of the International Speech
                  Communication Association, Singapore, September 14-18, 2014},
  pages        = {2734--2738},
  publisher    = {{ISCA}},
  year         = {2014},
  url          = {https://doi.org/10.21437/Interspeech.2014-157},
  doi          = {10.21437/INTERSPEECH.2014-157},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/KimCBS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/Bacchiani13,
  author       = {Bacchiani, Michiel},
  title        = {Rapid adaptation for mobile speech applications},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {7903--7907},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6639203},
  doi          = {10.1109/ICASSP.2013.6639203},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/Bacchiani13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SiohanB13,
  author       = {Siohan, Olivier and
                  Bacchiani, Michiel},
  editor       = {Bimbot, Fr{\'{e}}d{\'{e}}ric and
                  Cerisara, Christophe and
                  Fougeron, C{\'{e}}cile and
                  Gravier, Guillaume and
                  Lamel, Lori and
                  Pellegrino, Fran{\c{c}}ois and
                  Perrier, Pascal},
  title        = {ivector-based acoustic data selection},
  booktitle    = {{INTERSPEECH} 2013, 14th Annual Conference of the International Speech
                  Communication Association, Lyon, France, August 25-29, 2013},
  pages        = {657--661},
  publisher    = {{ISCA}},
  year         = {2013},
  url          = {https://doi.org/10.21437/Interspeech.2013-188},
  doi          = {10.21437/INTERSPEECH.2013-188},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SiohanB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/spm/LiuB11,
  author       = {Liu, Zhu and
                  Bacchiani, Michiel},
  title        = {{TechWare}: Mobile Media Search Resources [Best of the Web]},
  journal      = {{IEEE} Signal Process. Mag.},
  volume       = {28},
  number       = {4},
  pages        = {142--145},
  year         = {2011},
  url          = {https://doi.org/10.1109/MSP.2011.941095},
  doi          = {10.1109/MSP.2011.941095},
  timestamp    = {Thu, 21 Dec 2017 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/spm/LiuB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/AlbertiB11,
  author       = {Alberti, Christopher and
                  Bacchiani, Michiel},
  title        = {Discriminative Features for Language Identification},
  booktitle    = {{INTERSPEECH} 2011, 12th Annual Conference of the International Speech
                  Communication Association, Florence, Italy, August 27-31, 2011},
  pages        = {2917--2920},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {https://doi.org/10.21437/Interspeech.2011-730},
  doi          = {10.21437/INTERSPEECH.2011-730},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/AlbertiB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/LiaoABS10,
  author       = {Liao, Hank and
                  Alberti, Christopher and
                  Bacchiani, Michiel and
                  Siohan, Olivier},
  editor       = {Kobayashi, Takao and
                  Hirose, Keikichi and
                  Nakamura, Satoshi},
  title        = {Decision tree state clustering with word and syllable features},
  booktitle    = {{INTERSPEECH} 2010, 11th Annual Conference of the International Speech
                  Communication Association, Makuhari, Chiba, Japan, September 26-30,
                  2010},
  pages        = {2958--2961},
  publisher    = {{ISCA}},
  year         = {2010},
  url          = {https://doi.org/10.21437/Interspeech.2010-28},
  doi          = {10.21437/INTERSPEECH.2010-28},
  timestamp    = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/LiaoABS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/GravanoJB09,
  author       = {Gravano, Agust{\'{\i}}n and
                  Jansche, Martin and
                  Bacchiani, Michiel},
  title        = {Restoring punctuation and capitalization in transcribed speech},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {4741--4744},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960690},
  doi          = {10.1109/ICASSP.2009.4960690},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/GravanoJB09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/AlbertiBBCDLMPSSS09,
  author       = {Alberti, Christopher and
                  Bacchiani, Michiel and
                  Bezman, Ari and
                  Chelba, Ciprian and
                  Drofa, Anastassia and
                  Liao, Hank and
                  Moreno, Pedro J. and
                  Power, Ted and
                  Sahuguet, Arnaud and
                  Shugrina, Maria and
                  Siohan, Olivier},
  title        = {An audio indexing system for election video material},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2009, 19-24 April 2009, Taipei, Taiwan},
  pages        = {4873--4876},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICASSP.2009.4960723},
  doi          = {10.1109/ICASSP.2009.4960723},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/AlbertiBBCDLMPSSS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/GollanB08,
  author       = {Gollan, Christian and
                  Bacchiani, Michiel},
  title        = {Confidence scores for acoustic model adaptation},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars
                  Palace, Las Vegas, Nevada, {USA}},
  pages        = {4289--4292},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4518603},
  doi          = {10.1109/ICASSP.2008.4518603},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/GollanB08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BacchianiBSSS08,
  author       = {Bacchiani, Michiel and
                  Beaufays, Fran{\c{c}}oise and
                  Schalkwyk, Johan and
                  Schuster, Mike and
                  Strope, Brian},
  title        = {Deploying {GOOG-411:} Early lessons in data, measurement, and testing},
  booktitle    = {Proceedings of the {IEEE} International Conference on Acoustics, Speech,
                  and Signal Processing, {ICASSP} 2008, March 30 - April 4, 2008, Caesars
                  Palace, Las Vegas, Nevada, {USA}},
  pages        = {5260--5263},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICASSP.2008.4518846},
  doi          = {10.1109/ICASSP.2008.4518846},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BacchianiBSSS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/BacchianiRRS06,
  author       = {Bacchiani, Michiel and
                  Riley, Michael and
                  Roark, Brian and
                  Sproat, Richard},
  title        = {{MAP} adaptation of stochastic grammars},
  journal      = {Comput. Speech Lang.},
  volume       = {20},
  number       = {1},
  pages        = {41--68},
  year         = {2006},
  url          = {https://doi.org/10.1016/j.csl.2004.12.001},
  doi          = {10.1016/J.CSL.2004.12.001},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csl/BacchianiRRS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SiohanB05,
  author       = {Siohan, Olivier and
                  Bacchiani, Michiel},
  title        = {Fast vocabulary-independent audio search using path-based graph indexing},
  booktitle    = {{INTERSPEECH} 2005 - Eurospeech, 9th European Conference on Speech
                  Communication and Technology, Lisbon, Portugal, September 4-8, 2005},
  pages        = {53--56},
  publisher    = {{ISCA}},
  year         = {2005},
  url          = {https://doi.org/10.21437/Interspeech.2005-52},
  doi          = {10.21437/INTERSPEECH.2005-52},
  timestamp    = {Thu, 22 Jun 2023 16:42:16 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/SiohanB05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BacchianiR04,
  author       = {Bacchiani, Michiel and
                  Roark, Brian},
  title        = {Meta-data conditional language modeling},
  booktitle    = {2004 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages        = {241--244},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://doi.org/10.1109/ICASSP.2004.1325967},
  doi          = {10.1109/ICASSP.2004.1325967},
  timestamp    = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BacchianiR04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MaskeyBRS04,
  author    = {Maskey, Sameer
               and Bacchiani, Michiel
               and Roark, Brian
               and Sproat, Richard},
  title     = {Improved name recognition with
               meta-data dependent name networks},
  booktitle = {2004 {IEEE} International Conference on
               Acoustics, Speech, and Signal Processing,
               {ICASSP} 2004, Montreal, Quebec, Canada, May 17-21, 2004},
  pages     = {789--792},
  publisher = {{IEEE}},
  year      = {2004},
  url       = {https://doi.org/10.1109/ICASSP.2004.1326104},
  doi       = {10.1109/ICASSP.2004.1326104},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/MaskeyBRS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/BacchianiRS04,
  author    = {Bacchiani, Michiel
               and Roark, Brian
               and Saraclar, Murat},
  title     = {Language Model Adaptation with {MAP} Estimation
               and the Perceptron Algorithm},
  booktitle = {Proceedings of {HLT-NAACL} 2004: Short Papers,
               Boston, Massachusetts, USA, May 2-7, 2004},
  publisher = {The Association for Computational Linguistics},
  year      = {2004},
  url       = {https://aclanthology.org/N04-4006/},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/BacchianiRS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BacchianiR03,
  author    = {Bacchiani, Michiel
               and Roark, Brian},
  title     = {Unsupervised language model adaptation},
  booktitle = {2003 {IEEE} International Conference on
               Acoustics, Speech, and Signal Processing,
               {ICASSP} '03, Hong Kong, April 6-10, 2003},
  pages     = {224--227},
  publisher = {{IEEE}},
  year      = {2003},
  url       = {https://doi.org/10.1109/ICASSP.2003.1198758},
  doi       = {10.1109/ICASSP.2003.1198758},
  timestamp = {Mon, 22 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icassp/BacchianiR03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/RoarkB03,
  author    = {Roark, Brian
               and Bacchiani, Michiel},
  editor    = {Hearst, Marti A.
               and Ostendorf, Mari},
  title     = {Supervised and unsupervised {PCFG} adaptation
               to novel domains},
  booktitle = {Human Language Technology Conference of the
               North American Chapter of the Association for Computational Linguistics,
               {HLT-NAACL} 2003, Edmonton, Canada, May 27 - June 1, 2003},
  publisher = {The Association for Computational Linguistics},
  year      = {2003},
  url       = {https://aclanthology.org/N03-1027/},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/RoarkB03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SCANMail is brace-protected in the title so that sentence-casing
% bibliography styles keep the system name's capitalization.
@inproceedings{DBLP:conf/chi/WhittakerHASBISZR02,
  author    = {Whittaker, Steve
               and Hirschberg, Julia
               and Amento, Brian
               and Stark, Litza A.
               and Bacchiani, Michiel
               and Isenhour, Philip L.
               and Stead, Larry
               and Zamchick, Gary
               and Rosenberg, Aaron E.},
  editor    = {Wixon, Dennis R.},
  title     = {{SCANMail}: a voicemail interface that makes speech
               browsable, readable and searchable},
  booktitle = {Proceedings of the {CHI} 2002 Conference on
               Human Factors in Computing Systems:
               Changing our World, Changing ourselves,
               Minneapolis, Minnesota, USA, April 20-25, 2002},
  pages     = {275--282},
  publisher = {{ACM}},
  year      = {2002},
  url       = {https://doi.org/10.1145/503376.503426},
  doi       = {10.1145/503376.503426},
  timestamp = {Mon, 11 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/chi/WhittakerHASBISZR02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Bacchiani02,
  author    = {Bacchiani, Michiel},
  editor    = {Hansen, John H. L.
               and Pellom, Bryan L.},
  title     = {Combining maximum likelihood and maximum a posteriori estimation
               for detailed acoustic modeling of context dependency},
  booktitle = {7th International Conference on Spoken Language Processing,
               {ICSLP2002} - {INTERSPEECH} 2002,
               Denver, Colorado, USA, September 16-20, 2002},
  pages     = {2593--2596},
  publisher = {{ISCA}},
  year      = {2002},
  url       = {https://doi.org/10.21437/ICSLP.2002-344},
  doi       = {10.21437/ICSLP.2002-344},
  timestamp = {Thu, 22 Jun 2023 16:42:18 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/Bacchiani02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The company name in the title is wrapped in a single brace group so that
% sentence-casing bibliography styles cannot lowercase its letters.
@inproceedings{DBLP:conf/icassp/Bacchiani01,
  author    = {Bacchiani, Michiel},
  title     = {Automatic transcription of voicemail at {AT\&T}},
  booktitle = {{IEEE} International Conference on
               Acoustics, Speech, and Signal Processing,
               {ICASSP} 2001, 7-11 May, 2001,
               Salt Palace Convention Center, Salt Lake City, Utah, USA,
               Proceedings},
  pages     = {25--28},
  publisher = {{IEEE}},
  year      = {2001},
  url       = {https://doi.org/10.1109/ICASSP.2001.940758},
  doi       = {10.1109/ICASSP.2001.940758},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/Bacchiani01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SCANMail is brace-protected in the title so that sentence-casing
% bibliography styles keep the system name's capitalization.
@inproceedings{DBLP:conf/interspeech/HirschbergBHIRSSWZ01,
  author    = {Hirschberg, Julia
               and Bacchiani, Michiel
               and Hindle, Donald
               and Isenhour, Philip L.
               and Rosenberg, Aaron E.
               and Stark, Litza A.
               and Stead, Larry
               and Whittaker, Steve
               and Zamchick, Gary},
  editor    = {Dalsgaard, Paul
               and Lindberg, B{\o}rge
               and Benner, Henrik
               and Tan, Zheng{-}Hua},
  title     = {{SCANMail}: browsing and searching speech data by content},
  booktitle = {{EUROSPEECH} 2001 Scandinavia,
               7th European Conference on Speech Communication and Technology,
               2nd {INTERSPEECH} Event,
               Aalborg, Denmark, September 3-7, 2001},
  pages     = {1299--1302},
  publisher = {{ISCA}},
  year      = {2001},
  url       = {https://doi.org/10.21437/Eurospeech.2001-336},
  doi       = {10.21437/EUROSPEECH.2001-336},
  timestamp = {Thu, 22 Jun 2023 16:42:18 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/HirschbergBHIRSSWZ01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SCANMail is brace-protected in the title so that sentence-casing
% bibliography styles keep the system name's capitalization.
@inproceedings{DBLP:conf/interspeech/RosenbergHBPIS01,
  author    = {Rosenberg, Aaron E.
               and Hirschberg, Julia
               and Bacchiani, Michiel
               and Parthasarathy, Sarangarajan
               and Isenhour, Philip L.
               and Stead, Larry},
  editor    = {Dalsgaard, Paul
               and Lindberg, B{\o}rge
               and Benner, Henrik
               and Tan, Zheng{-}Hua},
  title     = {Caller identification for the {SCANMail} voicemail browser},
  booktitle = {{EUROSPEECH} 2001 Scandinavia,
               7th European Conference on Speech Communication and Technology,
               2nd {INTERSPEECH} Event,
               Aalborg, Denmark, September 3-7, 2001},
  pages     = {2373--2376},
  publisher = {{ISCA}},
  year      = {2001},
  url       = {https://doi.org/10.21437/Eurospeech.2001-559},
  doi       = {10.21437/EUROSPEECH.2001-559},
  timestamp = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/RosenbergHBPIS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SCANMail is brace-protected in the title so that sentence-casing
% bibliography styles keep the system name's capitalization.
@inproceedings{DBLP:conf/naacl/BacchianiHRWHIJ01,
  author    = {Bacchiani, Michiel
               and Hirschberg, Julia
               and Rosenberg, Aaron E.
               and Whittaker, Steve
               and Hindle, Donald
               and Isenhour, Philip L.
               and Jones, Matt
               and Stark, Litza A.
               and Zamchick, Gary},
  title     = {{SCANMail}: Audio Navigation in the Voicemail Domain},
  booktitle = {Proceedings of the First International Conference on
               Human Language Technology Research, {HLT} 2001,
               San Diego, California, USA, March 18-21, 2001},
  publisher = {Morgan Kaufmann},
  year      = {2001},
  url       = {https://aclanthology.org/H01-1064/},
  timestamp = {Mon, 11 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/BacchianiHRWHIJ01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nlprs/HirschbergBI01,
  author    = {Hirschberg, Julia
               and Bacchiani, Michiel
               and Isenhour, Philip L.},
  title     = {Audio Browsing and Search in the Voicemail Domain},
  booktitle = {Proceedings of the Sixth Natural Language Processing
               Pacific Rim Symposium, November 27-30, 2001,
               Hitotsubashi Memorial Hall, National Center of Sciences,
               Tokyo, Japan},
  pages     = {3--8},
  year      = {2001},
  url       = {http://www.afnlp.org/nlprs2001/pdf/inv-01-01.pdf},
  timestamp = {Thu, 04 Feb 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nlprs/HirschbergBI01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Bacchiani00,
  author    = {Bacchiani, Michiel},
  title     = {Using maximum likelihood linear regression
               for segment clustering and speaker identification},
  booktitle = {Sixth International Conference on Spoken Language Processing,
               {ICSLP} 2000 / {INTERSPEECH} 2000,
               Beijing, China, October 16-20, 2000},
  pages     = {536--539},
  publisher = {{ISCA}},
  year      = {2000},
  url       = {https://doi.org/10.21437/ICSLP.2000-867},
  doi       = {10.21437/ICSLP.2000-867},
  timestamp = {Thu, 22 Jun 2023 16:42:19 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/Bacchiani00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The combined-issue range in the number field uses a double hyphen (en dash),
% the same range convention as the pages field.
@article{DBLP:journals/speech/BacchianiO99,
  author    = {Bacchiani, Michiel
               and Ostendorf, Mari},
  title     = {Joint lexicon, acoustic unit inventory and model design},
  journal   = {Speech Commun.},
  volume    = {29},
  number    = {2--4},
  pages     = {99--114},
  year      = {1999},
  url       = {https://doi.org/10.1016/S0167-6393(99)00033-3},
  doi       = {10.1016/S0167-6393(99)00033-3},
  timestamp = {Sat, 22 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/speech/BacchianiO99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The company name in the title is wrapped in a single brace group so that
% sentence-casing bibliography styles cannot lowercase its letters.
@inproceedings{DBLP:conf/trec/SinghalABCHP99,
  author    = {Singhal, Amit
               and Abney, Steven P.
               and Bacchiani, Michiel
               and Collins, Michael
               and Hindle, Donald
               and Pereira, Fernando C. N.},
  editor    = {Voorhees, Ellen M.
               and Harman, Donna K.},
  title     = {{AT\&T} at {TREC-8}},
  booktitle = {Proceedings of The Eighth Text REtrieval Conference,
               {TREC} 1999, Gaithersburg, Maryland, USA,
               November 17-19, 1999},
  series    = {{NIST} Special Publication},
  volume    = {500-246},
  publisher = {National Institute of Standards and Technology {(NIST)}},
  year      = {1999},
  url       = {http://trec.nist.gov/pubs/trec8/papers/att-trec8.pdf},
  timestamp = {Wed, 07 Jul 2021 16:44:22 +0200},
  biburl    = {https://dblp.org/rec/conf/trec/SinghalABCHP99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/BacchianiO98,
  author    = {Bacchiani, Michiel
               and Ostendorf, Mari},
  title     = {Using automatically-derived acoustic sub-word units
               in large vocabulary speech recognition},
  booktitle = {The 5th International Conference on Spoken Language Processing,
               Incorporating The 7th Australian International
               Speech Science and Technology Conference,
               Sydney Convention Centre, Sydney, Australia,
               30th November - 4th December 1998},
  publisher = {{ISCA}},
  year      = {1998},
  url       = {https://doi.org/10.21437/ICSLP.1998-629},
  doi       = {10.21437/ICSLP.1998-629},
  timestamp = {Thu, 22 Jun 2023 16:42:19 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/BacchianiO98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BacchianiOSP96,
  author    = {Bacchiani, Michiel
               and Ostendorf, Mari
               and Sagisaka, Yoshinori
               and Paliwal, Kuldip K.},
  title     = {Design of a speech recognition system
               based on acoustically derived segmental units},
  booktitle = {1996 {IEEE} International Conference on
               Acoustics, Speech, and Signal Processing
               Conference Proceedings, {ICASSP} '96,
               Atlanta, Georgia, USA, May 7-10, 1996},
  pages     = {443--446},
  publisher = {{IEEE} Computer Society},
  year      = {1996},
  url       = {https://doi.org/10.1109/ICASSP.1996.541128},
  doi       = {10.1109/ICASSP.1996.541128},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/BacchianiOSP96.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/FukadaBPS96,
  author    = {Fukada, Toshiaki
               and Bacchiani, Michiel
               and Paliwal, Kuldip K.
               and Sagisaka, Yoshinori},
  title     = {Speech recognition based on
               acoustically derived segment units},
  booktitle = {The 4th International Conference on Spoken Language Processing,
               Philadelphia, PA, USA, October 3-6, 1996},
  pages     = {1077--1080},
  publisher = {{ISCA}},
  year      = {1996},
  url       = {https://doi.org/10.21437/ICSLP.1996-283},
  doi       = {10.21437/ICSLP.1996-283},
  timestamp = {Thu, 22 Jun 2023 16:42:20 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/FukadaBPS96.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/PaliwalBS95,
  author    = {Paliwal, Kuldip K.
               and Bacchiani, Michiel
               and Sagisaka, Yoshinori},
  title     = {Minimum classification error training algorithm
               for feature extractor and pattern classifier
               in speech recognition},
  booktitle = {Fourth European Conference on
               Speech Communication and Technology,
               {EUROSPEECH} 1995, Madrid, Spain, September 18-21, 1995},
  pages     = {541--544},
  publisher = {{ISCA}},
  year      = {1995},
  url       = {https://doi.org/10.21437/Eurospeech.1995-30},
  doi       = {10.21437/EUROSPEECH.1995-30},
  timestamp = {Sat, 01 Jul 2023 23:51:24 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/PaliwalBS95.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BacchianiA94,
  author    = {Bacchiani, Michiel
               and Aikawa, Kiyoaki},
  title     = {Optimization of time-frequency masking filters
               using the minimum classification error criterion},
  booktitle = {Proceedings of {ICASSP} '94: {IEEE} International Conference on
               Acoustics, Speech and Signal Processing,
               Adelaide, South Australia, Australia, April 19-22, 1994},
  pages     = {197--200},
  publisher = {{IEEE} Computer Society},
  year      = {1994},
  url       = {https://doi.org/10.1109/ICASSP.1994.389685},
  doi       = {10.1109/ICASSP.1994.389685},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icassp/BacchianiA94.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics