% Source: dblp publication search ("Search dblp for Publications").
% Exported results for "Ramon Sanabria", downloaded as a .bib file.

% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-2402-02617,
  author       = {Alexandra Saliba and
                  Yuanchao Li and
                  Ramon Sanabria and
                  Catherine Lai},
  title        = {Layer-Wise Analysis of Self-Supervised Acoustic Word Embeddings: {A}
                  Study on Speech Emotion Recognition},
  journal      = {CoRR},
  volume       = {abs/2402.02617},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2402.02617}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
% The last author is given in "Last, First" form so the two-word surname is not split
% (in "First Last" form BibTeX would take only the final word as the surname).
% "LLMs" is braced so sentence-casing styles do not lowercase the acronym.
@article{DBLP:journals/corr/abs-2404-01616,
  author       = {Frank Palma Gomez and
                  Ramon Sanabria and
                  Yun{-}Hsuan Sung and
                  Daniel Cer and
                  Siddharth Dalmia and
                  Hern{\'{a}}ndez {\'{A}}brego, Gustavo},
  title        = {Transforming {LLMs} into Cross-modal and Cross-lingual Retrieval Systems},
  journal      = {CoRR},
  volume       = {abs/2404.01616},
  year         = {2024},
  eprinttype   = {arXiv},
  eprint       = {2404.01616}
}
% ENC 2023 conference paper.
% "Matlab" is braced so sentence-casing styles keep its capital.
% NOTE(review): the second author's name repeats "Soria", and the title contains
% apparent misspellings ("Erythocytes", "procesing") and a missing space before "(".
% All are kept exactly as exported -- confirm against the publisher's record before
% correcting, since a bibliography should reproduce the published title.
@inproceedings{DBLP:conf/enc/GarciaMSPS23,
  author       = {Ricardo Garc{\'{\i}}a and
                  Soria Sergio Emmanuel Soria Medina and
                  Aldo Ram{\'{o}}n Sanabria Santiago and
                  Guillermo Rey Pe{\~{n}}aloza{-}Mendoza and
                  Carlos Alberto Trejo Ser{\'{a}}fico},
  title        = {Blood cell counting(Erythocytes) through image procesing in {Matlab}},
  booktitle    = {{ENC}},
  pages        = {1--5},
  year         = {2023}
}
% ICASSP 2023 conference paper; shares authors and title with the CoRR record
% DBLP:journals/corr/abs-2303-18110.
% The proper nouns "Edinburgh" and "English" are braced so sentence-casing styles
% do not lowercase them.
@inproceedings{DBLP:conf/icassp/SanabriaBMCKB23,
  author       = {Ramon Sanabria and
                  Nikolay Bogoychev and
                  Nina Markl and
                  Andrea Carmantini and
                  Ondrej Klejch and
                  Peter Bell},
  title        = {The {Edinburgh} International Accents of {English} Corpus: Towards the
                  Democratization of {English} {ASR}},
  booktitle    = {{ICASSP}},
  pages        = {1--5},
  year         = {2023}
}
% ICASSP Workshops 2023 paper. Same authors as the CoRR record
% DBLP:journals/corr/abs-2203-00648, whose title additionally contains "Individual".
@inproceedings{DBLP:conf/icassp/SanabriaHBA23,
  author    = {Sanabria, Ramon and Hsu, Wei{-}Ning and Baevski, Alexei and Auli, Michael},
  title     = {Measuring the Impact of Domain Factors in Self-Supervised Pre-Training},
  booktitle = {{ICASSP} Workshops},
  pages     = {1--5},
  year      = {2023},
}
% ICASSP 2023 conference paper. Same authors as the CoRR record
% DBLP:journals/corr/abs-2210-16043; the titles differ only in capitalisation.
@inproceedings{DBLP:conf/icassp/SanabriaTG23,
  author    = {Sanabria, Ramon and Tang, Hao and Goldwater, Sharon},
  title     = {Analyzing Acoustic Word Embeddings from Pre-Trained Self-Supervised Speech Models},
  booktitle = {{ICASSP}},
  pages     = {1--5},
  year      = {2023},
}
% INTERSPEECH 2023 conference paper; shares authors and title with the CoRR record
% DBLP:journals/corr/abs-2306-02153.
@inproceedings{DBLP:conf/interspeech/SanabriaKTG23,
  author    = {Sanabria, Ramon and Klejch, Ondrej and Tang, Hao and Goldwater, Sharon},
  title     = {Acoustic Word Embeddings for Untranscribed Target Languages with Continued Pretraining and Learned Pooling},
  booktitle = {{INTERSPEECH}},
  pages     = {406--410},
  year      = {2023},
}
% arXiv preprint (dblp CoRR record); shares authors and title with
% DBLP:conf/icassp/SanabriaBMCKB23. eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
% The proper nouns "Edinburgh" and "English" are braced so sentence-casing styles
% do not lowercase them.
@article{DBLP:journals/corr/abs-2303-18110,
  author       = {Ramon Sanabria and
                  Nikolay Bogoychev and
                  Nina Markl and
                  Andrea Carmantini and
                  Ondrej Klejch and
                  Peter Bell},
  title        = {The {Edinburgh} International Accents of {English} Corpus: Towards the
                  Democratization of {English} {ASR}},
  journal      = {CoRR},
  volume       = {abs/2303.18110},
  year         = {2023},
  eprinttype   = {arXiv},
  eprint       = {2303.18110}
}
% arXiv preprint (dblp CoRR record); shares authors and title with
% DBLP:conf/interspeech/SanabriaKTG23. eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-2306-02153,
  author       = {Ramon Sanabria and
                  Ondrej Klejch and
                  Hao Tang and
                  Sharon Goldwater},
  title        = {Acoustic Word Embeddings for Untranscribed Target Languages with Continued
                  Pretraining and Learned Pooling},
  journal      = {CoRR},
  volume       = {abs/2306.02153},
  year         = {2023},
  eprinttype   = {arXiv},
  eprint       = {2306.02153}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-2203-00648,
  author       = {Ramon Sanabria and
                  Wei{-}Ning Hsu and
                  Alexei Baevski and
                  Michael Auli},
  title        = {Measuring the Impact of Individual Domain Factors in Self-Supervised
                  Pre-Training},
  journal      = {CoRR},
  volume       = {abs/2203.00648},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2203.00648}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-2210-16043,
  author       = {Ramon Sanabria and
                  Hao Tang and
                  Sharon Goldwater},
  title        = {Analyzing Acoustic Word Embeddings from Pre-trained Self-supervised
                  Speech Models},
  journal      = {CoRR},
  volume       = {abs/2210.16043},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2210.16043}
}
% Interspeech 2021 conference paper; shares authors and title with the CoRR record
% DBLP:journals/corr/abs-2104-01894.
% The venue is written as {INTERSPEECH}, matching the other entries for this
% conference series in this file, so the bibliography shows one spelling.
@inproceedings{DBLP:conf/interspeech/SanabriaWB21,
  author       = {Ramon Sanabria and
                  Austin Waters and
                  Jason Baldridge},
  title        = {Talk, Don't Write: {A} Study of Direct Speech-Based Image Retrieval},
  booktitle    = {{INTERSPEECH}},
  pages        = {2976--2980},
  year         = {2021}
}
% arXiv preprint (dblp CoRR record); shares authors and title with
% DBLP:conf/interspeech/SanabriaWB21. eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-2104-01894,
  author       = {Ramon Sanabria and
                  Austin Waters and
                  Jason Baldridge},
  title        = {Talk, Don't Write: {A} Study of Direct Speech-Based Image Retrieval},
  journal      = {CoRR},
  volume       = {abs/2104.01894},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2104.01894}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-2109-10107,
  author       = {Ramon Sanabria and
                  Hao Tang and
                  Sharon Goldwater},
  title        = {On the Difficulty of Segmenting Words with Attention},
  journal      = {CoRR},
  volume       = {abs/2109.10107},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2109.10107}
}
% Journal article in Comput. Speech Lang., volume 64 (2020).
% The pages field holds a single number rather than a range.
@article{DBLP:journals/csl/PalaskarSM20,
  author  = {Palaskar, Shruti and Sanabria, Ramon and Metze, Florian},
  title   = {Transfer learning for multimodal dialog},
  journal = {Comput. Speech Lang.},
  volume  = {64},
  pages   = {101093},
  year    = {2020},
}
% Journal article in IEEE J. Sel. Top. Signal Process., volume 14, number 3 (2020).
% Eighteen authors, written in "Last, First" form.
@article{DBLP:journals/jstsp/SpeciaBCDEGHLLL20,
  author  = {Specia, Lucia
             and Barrault, Lo{\"{\i}}c
             and Caglayan, Ozan
             and Duarte, Amanda Cardoso
             and Elliott, Desmond
             and Gella, Spandana
             and Holzenberger, Nils
             and Lala, Chiraag
             and Lee, Sun Jae
             and Libovick{\'{y}}, Jindrich
             and Madhyastha, Pranava
             and Metze, Florian
             and Mulligan, Karl
             and Ostapenko, Alissa
             and Palaskar, Shruti
             and Sanabria, Ramon
             and Wang, Josiah
             and Arora, Raman},
  title   = {Grounded Sequence to Sequence Transduction},
  journal = {{IEEE} J. Sel. Top. Signal Process.},
  volume  = {14},
  number  = {3},
  pages   = {577--591},
  year    = {2020},
}
% EMNLP (Findings) 2020 paper; shares authors and title with the CoRR record
% DBLP:journals/corr/abs-2010-02384.
@inproceedings{DBLP:conf/emnlp/SrinivasanSME20,
  author    = {Srinivasan, Tejas and Sanabria, Ramon and Metze, Florian and Elliott, Desmond},
  title     = {Fine-Grained Grounding for Multimodal Speech Recognition},
  booktitle = {{EMNLP} (Findings)},
  pages     = {2667--2677},
  year      = {2020},
}
% ICASSP 2020 conference paper; shares authors and title with the CoRR record
% DBLP:journals/corr/abs-2002-05639.
@inproceedings{DBLP:conf/icassp/SrinivasanSM20,
  author    = {Srinivasan, Tejas and Sanabria, Ramon and Metze, Florian},
  title     = {Looking Enhances Listening: Recovering Missing Speech Using Images},
  booktitle = {{ICASSP}},
  pages     = {6304--6308},
  year      = {2020},
}
% arXiv preprint (dblp CoRR record); shares authors and title with
% DBLP:conf/icassp/SrinivasanSM20. eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-2002-05639,
  author       = {Tejas Srinivasan and
                  Ramon Sanabria and
                  Florian Metze},
  title        = {Looking Enhances Listening: Recovering Missing Speech Using Images},
  journal      = {CoRR},
  volume       = {abs/2002.05639},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2002.05639}
}
% arXiv preprint (dblp CoRR record); shares authors and title with
% DBLP:conf/emnlp/SrinivasanSME20. eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-2010-02384,
  author       = {Tejas Srinivasan and
                  Ramon Sanabria and
                  Florian Metze and
                  Desmond Elliott},
  title        = {Fine-Grained Grounding for Multimodal Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/2010.02384},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2010.02384}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-2010-08642,
  author       = {Tejas Srinivasan and
                  Ramon Sanabria and
                  Florian Metze and
                  Desmond Elliott},
  title        = {Multimodal Speech Recognition with Unstructured Audio Masking},
  journal      = {CoRR},
  volume       = {abs/2010.08642},
  year         = {2020},
  eprinttype   = {arXiv},
  eprint       = {2010.08642}
}
% ICASSP 2019 conference paper. Same authors as the CoRR record
% DBLP:journals/corr/abs-1811-03865; the titles differ only in capitalisation.
@inproceedings{DBLP:conf/icassp/CaglayanSPBM19,
  author    = {Caglayan, Ozan
               and Sanabria, Ramon
               and Palaskar, Shruti
               and Barrault, Lo{\"{\i}}c
               and Metze, Florian},
  title     = {Multimodal Grounding for Sequence-to-sequence Speech Recognition},
  booktitle = {{ICASSP}},
  pages     = {8648--8652},
  year      = {2019},
}
% IWSLT 2019 paper (no pages recorded). Its author list is the same as the editor
% list of the proceedings record DBLP:conf/iwslt/2019.
@inproceedings{DBLP:conf/iwslt/NiehuesCSNTHSSB19,
  author    = {Niehues, Jan
               and Cattoni, Roldano
               and St{\"{u}}ker, Sebastian
               and Negri, Matteo
               and Turchi, Marco
               and Ha, Thanh{-}Le
               and Salesky, Elizabeth
               and Sanabria, Ramon
               and Barrault, Lo{\"{\i}}c
               and Specia, Lucia
               and Federico, Marcello},
  title     = {The {IWSLT} 2019 Evaluation Campaign},
  booktitle = {{IWSLT}},
  year      = {2019},
}
% IWSLT 2019 paper (no pages recorded).
% "CMU" is braced so sentence-casing styles do not turn the acronym into "Cmu".
@inproceedings{DBLP:conf/iwslt/SrinivasanSM19,
  author       = {Tejas Srinivasan and
                  Ramon Sanabria and
                  Florian Metze},
  title        = {{CMU}'s Machine Translation System for {IWSLT} 2019},
  booktitle    = {{IWSLT}},
  year         = {2019}
}
% IWSLT 2019 paper (no pages recorded); shares authors and title with the CoRR record
% DBLP:journals/corr/abs-1910-12368.
@inproceedings{DBLP:conf/iwslt/SrinivasanSM19a,
  author    = {Srinivasan, Tejas and Sanabria, Ramon and Metze, Florian},
  title     = {Multitask Learning For Different Subword Segmentations In Neural Machine Translation},
  booktitle = {{IWSLT}},
  year      = {2019},
}
% MediaEval 2019 paper (no pages recorded).
% "MediaEval" is braced so sentence-casing styles keep its internal capital.
@inproceedings{DBLP:conf/mediaeval/MoriyaSMJ19,
  author       = {Yasufumi Moriya and
                  Ramon Sanabria and
                  Florian Metze and
                  Gareth J. F. Jones},
  title        = {{MediaEval} 2019: Eyes and Ears Together},
  booktitle    = {MediaEval},
  year         = {2019}
}
% Proceedings volume for IWSLT 2019. No entry in this file cross-references it;
% the IWSLT papers carry their own booktitle and year.
@proceedings{DBLP:conf/iwslt/2019,
  editor    = {Niehues, Jan
               and Cattoni, Roldano
               and St{\"{u}}ker, Sebastian
               and Negri, Matteo
               and Turchi, Marco
               and Ha, Thanh{-}Le
               and Salesky, Elizabeth
               and Sanabria, Ramon
               and Barrault, Lo{\"{\i}}c
               and Specia, Lucia
               and Federico, Marcello},
  title     = {Proceedings of the 16th International Conference on Spoken Language Translation, {IWSLT} 2019, Hong Kong, November 2-3, 2019},
  publisher = {Association for Computational Linguistics},
  year      = {2019},
}
% TAC 2019 paper (no pages recorded). Carries the same title as the TAC 2018 record
% DBLP:conf/tac/HovyBCCGHMMCCHL18, with a different author list.
@inproceedings{DBLP:conf/tac/HovyCCGHMMSDCCK19,
  author    = {Hovy, Eduard H.
               and Carbonell, Jaime G.
               and Chalupsky, Hans
               and Gershman, Anatole
               and Hauptmann, Alex
               and Metze, Florian
               and Mitamura, Teruko
               and Sheikh, Zaid
               and Dangi, Ankit
               and Chaudhary, Aditi
               and Chen, Xianyang
               and Kong, Xiang
               and Huang, Bernie
               and Medina, Salvador
               and Liu, Hector
               and Ma, Xuezhe
               and Ryskina, Maria
               and Sanabria, Ramon
               and Gangal, Varun},
  title     = {{OPERA:} Operations-oriented Probabilistic Extraction, Reasoning, and Analysis},
  booktitle = {{TAC}},
  year      = {2019},
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1906-06147,
  author       = {Yasufumi Moriya and
                  Ramon Sanabria and
                  Florian Metze and
                  Gareth J. F. Jones},
  title        = {Grounding Object Detections With Transcriptions},
  journal      = {CoRR},
  volume       = {abs/1906.06147},
  year         = {2019},
  eprinttype   = {arXiv},
  eprint       = {1906.06147}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1907-00477,
  author       = {Tejas Srinivasan and
                  Ramon Sanabria and
                  Florian Metze},
  title        = {Analyzing Utility of Visual Context in Multimodal Speech Recognition
                  Under Noisy Conditions},
  journal      = {CoRR},
  volume       = {abs/1907.00477},
  year         = {2019},
  eprinttype   = {arXiv},
  eprint       = {1907.00477}
}
% arXiv preprint (dblp CoRR record); shares authors and title with
% DBLP:conf/iwslt/SrinivasanSM19a. eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1910-12368,
  author       = {Tejas Srinivasan and
                  Ramon Sanabria and
                  Florian Metze},
  title        = {Multitask Learning For Different Subword Segmentations In Neural Machine
                  Translation},
  journal      = {CoRR},
  volume       = {abs/1910.12368},
  year         = {2019},
  eprinttype   = {arXiv},
  eprint       = {1910.12368}
}
% ICASSP 2018 conference paper. Same authors as the CoRR record
% DBLP:journals/corr/abs-1802-07420; the titles differ only in capitalisation.
@inproceedings{DBLP:conf/icassp/DalmiaSMB18,
  author    = {Dalmia, Siddharth and Sanabria, Ramon and Metze, Florian and Black, Alan W.},
  title     = {Sequence-Based Multi-Lingual Low Resource Speech Recognition},
  booktitle = {{ICASSP}},
  pages     = {4909--4913},
  year      = {2018},
}
% ICASSP 2018 conference paper. Same authors as the CoRR record
% DBLP:journals/corr/abs-1804-09713; the titles differ only in capitalisation.
@inproceedings{DBLP:conf/icassp/PalaskarSM18,
  author    = {Palaskar, Shruti and Sanabria, Ramon and Metze, Florian},
  title     = {End-to-end Multimodal Speech Recognition},
  booktitle = {{ICASSP}},
  pages     = {5774--5778},
  year      = {2018},
}
% INTERSPEECH 2018 conference paper; shares authors and title with the CoRR record
% DBLP:journals/corr/abs-1712-06855.
@inproceedings{DBLP:conf/interspeech/ZenkelSMW18,
  author    = {Zenkel, Thomas and Sanabria, Ramon and Metze, Florian and Waibel, Alex},
  title     = {Subword and Crossword Units for {CTC} Acoustic Models},
  booktitle = {{INTERSPEECH}},
  pages     = {396--400},
  year      = {2018},
}
% MediaEval 2018 paper (no pages recorded).
@inproceedings{DBLP:conf/mediaeval/MoriyaSMJ18,
  author    = {Moriya, Yasufumi and Sanabria, Ramon and Metze, Florian and Jones, Gareth J. F.},
  title     = {Eyes and Ears Together: New Task for Multimodal Spoken Content Analysis},
  booktitle = {MediaEval},
  year      = {2018},
}
% SLT 2018 conference paper. Same authors as the CoRR record
% DBLP:journals/corr/abs-1807-07104, whose title reads "Multi Task" instead of "Multitask".
@inproceedings{DBLP:conf/slt/SanabriaM18,
  author    = {Sanabria, Ramon and Metze, Florian},
  title     = {Hierarchical Multitask Learning With {CTC}},
  booktitle = {{SLT}},
  pages     = {485--490},
  year      = {2018},
}
% TAC 2018 paper (no pages recorded). Carries the same title as the TAC 2019 record
% DBLP:conf/tac/HovyCCGHMMSDCCK19, with a different author list.
@inproceedings{DBLP:conf/tac/HovyBCCGHMMCCHL18,
  author    = {Hovy, Eduard H.
               and Berg{-}Kirkpatrick, Taylor
               and Carbonell, Jaime G.
               and Chalupsky, Hans
               and Gershman, Anatole
               and Hauptmann, Alexander G.
               and Metze, Florian
               and Mitamura, Teruko
               and Chaudhary, Aditi
               and Chen, Xianyang
               and Huang, Bernie Po{-}Yao
               and Liu, Hector Zhengzhong
               and Ma, Xuezhe
               and Palaskar, Shruti
               and Rajagopal, Dheeraj
               and Ryskina, Maria
               and Sanabria, Ramon},
  title     = {{OPERA:} Operations-oriented Probabilistic Extraction, Reasoning, and Analysis},
  booktitle = {{TAC}},
  year      = {2018},
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1802-07420,
  author       = {Siddharth Dalmia and
                  Ramon Sanabria and
                  Florian Metze and
                  Alan W. Black},
  title        = {Sequence-based Multi-lingual Low Resource Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1802.07420},
  year         = {2018},
  eprinttype   = {arXiv},
  eprint       = {1802.07420}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1804-09713,
  author       = {Shruti Palaskar and
                  Ramon Sanabria and
                  Florian Metze},
  title        = {End-to-End Multimodal Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1804.09713},
  year         = {2018},
  eprinttype   = {arXiv},
  eprint       = {1804.09713}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1807-07104,
  author       = {Ramon Sanabria and
                  Florian Metze},
  title        = {Hierarchical Multi Task Learning With {CTC}},
  journal      = {CoRR},
  volume       = {abs/1807.07104},
  year         = {2018},
  eprinttype   = {arXiv},
  eprint       = {1807.07104}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1811-00347,
  author       = {Ramon Sanabria and
                  Ozan Caglayan and
                  Shruti Palaskar and
                  Desmond Elliott and
                  Lo{\"{\i}}c Barrault and
                  Lucia Specia and
                  Florian Metze},
  title        = {How2: {A} Large-scale Dataset for Multimodal Language Understanding},
  journal      = {CoRR},
  volume       = {abs/1811.00347},
  year         = {2018},
  eprinttype   = {arXiv},
  eprint       = {1811.00347}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1811-03865,
  author       = {Ozan Caglayan and
                  Ramon Sanabria and
                  Shruti Palaskar and
                  Lo{\"{\i}}c Barrault and
                  Florian Metze},
  title        = {Multimodal Grounding for Sequence-to-Sequence Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1811.03865},
  year         = {2018},
  eprinttype   = {arXiv},
  eprint       = {1811.03865}
}
% INTERSPEECH 2017 conference paper; shares authors and title with the CoRR record
% DBLP:journals/corr/abs-1708-04469.
@inproceedings{DBLP:conf/interspeech/ZenkelSMNSSW17,
  author    = {Zenkel, Thomas
               and Sanabria, Ramon
               and Metze, Florian
               and Niehues, Jan
               and Sperber, Matthias
               and St{\"{u}}ker, Sebastian
               and Waibel, Alex},
  title     = {Comparison of Decoding Strategies for {CTC} Acoustic Models},
  booktitle = {{INTERSPEECH}},
  pages     = {513--517},
  year      = {2017},
}
% NOF 2017 conference paper. The search term matches here through the authors
% "Luis Sanabria-Russo" and "Ramon Casellas"; no author is named "Ramon Sanabria".
@inproceedings{DBLP:conf/nof/VilaltaVMSMCMA17,
  author    = {Vilalta, Ricard
               and Via, Selva
               and Mira, Ferm{\'{\i}}n
               and Sanabria{-}Russo, Luis
               and Mart{\'{\i}}nez, Ricardo
               and Casellas, Ramon
               and Mu{\~{n}}oz, Raul
               and Alonso{-}Zarate, Jesus},
  title     = {Control and management of a connected car using {YANG/RESTCONF} and cloud computing},
  booktitle = {{NOF}},
  pages     = {120--122},
  year      = {2017},
}
% arXiv preprint (dblp CoRR record); shares authors and title with
% DBLP:conf/interspeech/ZenkelSMNSSW17. eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1708-04469,
  author       = {Thomas Zenkel and
                  Ramon Sanabria and
                  Florian Metze and
                  Jan Niehues and
                  Matthias Sperber and
                  Sebastian St{\"{u}}ker and
                  Alex Waibel},
  title        = {Comparison of Decoding Strategies for {CTC} Acoustic Models},
  journal      = {CoRR},
  volume       = {abs/1708.04469},
  year         = {2017},
  eprinttype   = {arXiv},
  eprint       = {1708.04469}
}
% arXiv preprint (dblp CoRR record); shares authors and title with
% DBLP:conf/interspeech/ZenkelSMW18. eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
@article{DBLP:journals/corr/abs-1712-06855,
  author       = {Thomas Zenkel and
                  Ramon Sanabria and
                  Florian Metze and
                  Alex Waibel},
  title        = {Subword and Crossword Units for {CTC} Acoustic Models},
  journal      = {CoRR},
  volume       = {abs/1712.06855},
  year         = {2017},
  eprinttype   = {arXiv},
  eprint       = {1712.06855}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
% The third author is given as a braced surname in "Last, First" form: written as
% "Fernando De la Torre", BibTeX would parse "De" as a given name and "la" as a
% von-particle, leaving only "Torre" as the surname.
@article{DBLP:journals/corr/SanabriaMT16,
  author       = {Ramon Sanabria and
                  Florian Metze and
                  {De la Torre}, Fernando},
  title        = {Robust end-to-end deep audiovisual speech recognition},
  journal      = {CoRR},
  volume       = {abs/1611.06986},
  year         = {2016},
  eprinttype   = {arXiv},
  eprint       = {1611.06986}
}
% arXiv preprint (dblp CoRR record). eprint/eprinttype repeat the arXiv id from the
% volume field so that eprint-aware styles can print and link it.
% The project name "Commons for Europe" is braced so sentence-casing styles keep its
% capitals.
% The search term matches here through the authors "Ramon Roca" and
% "Luis Sanabria-Russo"; no author is named "Ramon Sanabria".
@article{DBLP:journals/corr/abs-1207-1031,
  author       = {Jaume Barcel{\'{o}} and
                  Boris Bellalta and
                  Roger Baig and
                  Ramon Roca and
                  Albert Domingo and
                  Luis Sanabria{-}Russo and
                  Cristina Cano and
                  Miquel Oliver},
  title        = {Bottom-up Broadband Initiatives in the {Commons for Europe} Project},
  journal      = {CoRR},
  volume       = {abs/1207.1031},
  year         = {2012},
  eprinttype   = {arXiv},
  eprint       = {1207.1031}
}
% dblp is a service of Schloss Dagstuhl - Leibniz Center for Informatics.