BibTeX records: Fabian Caba Heilbron

download as .bib file

% MMM 2024 conference paper (LNCS vol. 14556). The doi and url values are stored
% verbatim, without a backslash before the underscore, as url-aware styles and
% biblatex expect. Names use the unambiguous "Last, First" form.
@inproceedings{DBLP:conf/mmm/XingTCDYWBC24,
  author       = {Xing, Linzi and
                  Tran, Quan Hung and
                  Caba, Fabian and
                  Dernoncourt, Franck and
                  Yoon, Seunghyun and
                  Wang, Zhaowen and
                  Bui, Trung and
                  Carenini, Giuseppe},
  editor       = {Rudinac, Stevan and
                  Hanjalic, Alan and
                  Liem, Cynthia C. S. and
                  Worring, Marcel and
                  J{\'{o}}nsson, Bj{\"{o}}rn {\TH}{\'{o}}r and
                  Liu, Bei and
                  Yamakata, Yoko},
  title        = {Multi-modal Video Topic Segmentation with Dual-Contrastive Domain
                  Adaptation},
  booktitle    = {MultiMedia Modeling - 30th International Conference, {MMM} 2024, Amsterdam,
                  The Netherlands, January 29 - February 2, 2024, Proceedings, Part
                  {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {14556},
  pages        = {410--424},
  publisher    = {Springer},
  year         = {2024},
  url          = {https://doi.org/10.1007/978-3-031-53311-2_30},
  doi          = {10.1007/978-3-031-53311-2_30},
  timestamp    = {Sat, 02 Mar 2024 21:19:05 +0100},
  biburl       = {https://dblp.org/rec/conf/mmm/XingTCDYWBC24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.03398 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form to keep BibTeX from splitting it.
@article{DBLP:journals/corr/abs-2404-03398,
  author       = {Argaw, Dawit Mureja and
                  Yoon, Seunghyun and
                  Caba Heilbron, Fabian and
                  Deilamsalehy, Hanieh and
                  Bui, Trung and
                  Wang, Zhaowen and
                  Dernoncourt, Franck and
                  Chung, Joon Son},
  title        = {Scaling Up Video Summarization Pretraining with Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2404.03398},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.03398},
  doi          = {10.48550/ARXIV.2404.03398},
  eprinttype   = {arXiv},
  eprint       = {2404.03398},
  timestamp    = {Mon, 13 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-03398.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.03477 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form to keep BibTeX from splitting it.
@article{DBLP:journals/corr/abs-2404-03477,
  author       = {Argaw, Dawit Mureja and
                  Soldan, Mattia and
                  Pardo, Alejandro and
                  Zhao, Chen and
                  Caba Heilbron, Fabian and
                  Chung, Joon Son and
                  Ghanem, Bernard},
  title        = {Towards Automated Movie Trailer Generation},
  journal      = {CoRR},
  volume       = {abs/2404.03477},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.03477},
  doi          = {10.48550/ARXIV.2404.03477},
  eprinttype   = {arXiv},
  eprint       = {2404.03477},
  timestamp    = {Mon, 13 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-03477.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.03913 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form. The method name in the title is braced
% so sentence-casing styles do not lowercase "Weaver".
@article{DBLP:journals/corr/abs-2404-03913,
  author       = {Kwon, Gihyun and
                  Jenni, Simon and
                  Li, Dingzeyu and
                  Lee, Joon{-}Young and
                  Ye, Jong Chul and
                  Caba Heilbron, Fabian},
  title        = {{Concept Weaver}: Enabling Multi-Concept Fusion in Text-to-Image Models},
  journal      = {CoRR},
  volume       = {abs/2404.03913},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.03913},
  doi          = {10.48550/ARXIV.2404.03913},
  eprinttype   = {arXiv},
  eprint       = {2404.03913},
  timestamp    = {Mon, 13 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-03913.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2023 Workshops paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form to keep BibTeX from splitting it.
@inproceedings{DBLP:conf/cvpr/RamazanovaEHZG23,
  author       = {Ramazanova, Merey and
                  Escorcia, Victor and
                  Caba Heilbron, Fabian and
                  Zhao, Chen and
                  Ghanem, Bernard},
  title        = {{OWL} (Observe, Watch, Listen): Audiovisual Temporal Context for Localizing
                  Actions in Egocentric Videos},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2023 - Workshops, Vancouver, BC, Canada, June 17-24, 2023},
  pages        = {4880--4890},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CVPRW59228.2023.00516},
  doi          = {10.1109/CVPRW59228.2023.00516},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/RamazanovaEHZG23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2023 conference paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form to keep BibTeX from splitting it.
@inproceedings{DBLP:conf/cvpr/YehRSHJ23,
  author       = {Yeh, Chun{-}Hsiao and
                  Russell, Bryan C. and
                  Sivic, Josef and
                  Caba Heilbron, Fabian and
                  Jenni, Simon},
  title        = {Meta-Personalizing Vision-Language Models to Find Named Instances
                  in Video},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2023, Vancouver, BC, Canada, June 17-24, 2023},
  pages        = {19123--19132},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CVPR52729.2023.01833},
  doi          = {10.1109/CVPR52729.2023.01833},
  timestamp    = {Thu, 28 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/YehRSHJ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2023 conference paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form to keep BibTeX from splitting it.
@inproceedings{DBLP:conf/cvpr/VillaAAAHHSG23,
  author       = {Villa, Andr{\'{e}}s and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Alfarra, Motasem and
                  Alhamoud, Kumail and
                  Hurtado, Julio and
                  Caba Heilbron, Fabian and
                  Soto, Alvaro and
                  Ghanem, Bernard},
  title        = {{PIVOT:} Prompting for Video Continual Learning},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2023, Vancouver, BC, Canada, June 17-24, 2023},
  pages        = {24214--24223},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CVPR52729.2023.02319},
  doi          = {10.1109/CVPR52729.2023.02319},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/VillaAAAHHSG23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2023 conference paper. Names are written in "Last, First" form; the
% name parts BibTeX derives are the same as for the "First Last" spelling.
@inproceedings{DBLP:conf/iccv/LeiCCJPL23,
  author     = {Lei, Ting and
                Caba, Fabian and
                Chen, Qingchao and
                Jin, Hailin and
                Peng, Yuxin and
                Liu, Yang},
  title      = {Efficient Adaptive Human-Object Interaction Detection with Concept-guided
                Memory},
  booktitle  = {{IEEE/CVF} International Conference on Computer Vision, {ICCV} 2023,
                Paris, France, October 1-6, 2023},
  pages      = {6457--6467},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/ICCV51070.2023.00596},
  doi        = {10.1109/ICCV51070.2023.00596},
  timestamp  = {Tue, 26 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iccv/LeiCCJPL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2023 conference paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form to keep BibTeX from splitting it.
@inproceedings{DBLP:conf/iccv/ArgawLWKH23,
  author       = {Argaw, Dawit Mureja and
                  Lee, Joon{-}Young and
                  Woodson, Markus and
                  Kweon, In So and
                  Caba Heilbron, Fabian},
  title        = {Long-range Multimodal Pretraining for Movie Understanding},
  booktitle    = {{IEEE/CVF} International Conference on Computer Vision, {ICCV} 2023,
                  Paris, France, October 1-6, 2023},
  pages        = {13346--13357},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICCV51070.2023.01232},
  doi          = {10.1109/ICCV51070.2023.01232},
  timestamp    = {Mon, 22 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/ArgawLWKH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2023 conference paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form to keep BibTeX from splitting it.
@inproceedings{DBLP:conf/iccv/BarriosSCHG23,
  author       = {Barrios, Wayner and
                  Soldan, Mattia and
                  Ceballos{-}Arroyo, Alberto Mario and
                  Caba Heilbron, Fabian and
                  Ghanem, Bernard},
  title        = {Localizing Moments in Long Video Via Multimodal Guidance},
  booktitle    = {{IEEE/CVF} International Conference on Computer Vision, {ICCV} 2023,
                  Paris, France, October 1-6, 2023},
  pages        = {13621--13632},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICCV51070.2023.01257},
  doi          = {10.1109/ICCV51070.2023.01257},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/BarriosSCHG23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2302.13372 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form to keep BibTeX from splitting it.
@article{DBLP:journals/corr/abs-2302-13372,
  author       = {Barrios, Wayner and
                  Soldan, Mattia and
                  Caba Heilbron, Fabian and
                  Ceballos{-}Arroyo, Alberto Mario and
                  Ghanem, Bernard},
  title        = {Localizing Moments in Long Video Via Multimodal Guidance},
  journal      = {CoRR},
  volume       = {abs/2302.13372},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.13372},
  doi          = {10.48550/ARXIV.2302.13372},
  eprinttype   = {arXiv},
  eprint       = {2302.13372},
  timestamp    = {Tue, 28 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-13372.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.10169 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form to keep BibTeX from splitting it.
@article{DBLP:journals/corr/abs-2306-10169,
  author       = {Yeh, Chun{-}Hsiao and
                  Russell, Bryan C. and
                  Sivic, Josef and
                  Caba Heilbron, Fabian and
                  Jenni, Simon},
  title        = {Meta-Personalizing Vision-Language Models to Find Named Instances
                  in Video},
  journal      = {CoRR},
  volume       = {abs/2306.10169},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.10169},
  doi          = {10.48550/ARXIV.2306.10169},
  eprinttype   = {arXiv},
  eprint       = {2306.10169},
  timestamp    = {Thu, 28 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-10169.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2308.09775 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form to keep BibTeX from splitting it.
@article{DBLP:journals/corr/abs-2308-09775,
  author       = {Argaw, Dawit Mureja and
                  Lee, Joon{-}Young and
                  Woodson, Markus and
                  Kweon, In So and
                  Caba Heilbron, Fabian},
  title        = {Long-range Multimodal Pretraining for Movie Understanding},
  journal      = {CoRR},
  volume       = {abs/2308.09775},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.09775},
  doi          = {10.48550/ARXIV.2308.09775},
  eprinttype   = {arXiv},
  eprint       = {2308.09775},
  timestamp    = {Fri, 25 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-09775.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2309.03696 (CoRR). Names are written in "Last, First" form;
% the name parts BibTeX derives are the same as for the "First Last" spelling.
@article{DBLP:journals/corr/abs-2309-03696,
  author     = {Lei, Ting and
                Caba, Fabian and
                Chen, Qingchao and
                Jin, Hailin and
                Peng, Yuxin and
                Liu, Yang},
  title      = {Efficient Adaptive Human-Object Interaction Detection with Concept-guided
                Memory},
  journal    = {CoRR},
  volume     = {abs/2309.03696},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.03696},
  doi        = {10.48550/ARXIV.2309.03696},
  eprinttype = {arXiv},
  eprint     = {2309.03696},
  timestamp  = {Tue, 26 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-03696.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2312.00220 (CoRR). Names are written in "Last, First" form;
% the name parts BibTeX derives are the same as for the "First Last" spelling.
@article{DBLP:journals/corr/abs-2312-00220,
  author     = {Xing, Linzi and
                Tran, Quan Hung and
                Caba, Fabian and
                Dernoncourt, Franck and
                Yoon, Seunghyun and
                Wang, Zhaowen and
                Bui, Trung and
                Carenini, Giuseppe},
  title      = {Multi-Modal Video Topic Segmentation with Dual-Contrastive Domain
                Adaptation},
  journal    = {CoRR},
  volume     = {abs/2312.00220},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2312.00220},
  doi        = {10.48550/ARXIV.2312.00220},
  eprinttype = {arXiv},
  eprint     = {2312.00220},
  timestamp  = {Fri, 08 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2312-00220.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% BMVC 2022 conference paper; "pages" holds the paper number 939 used in the URL.
% "FitCLIP" is braced so sentence-casing styles do not turn it into "Fitclip".
@inproceedings{DBLP:conf/bmvc/CastroC22,
  author       = {Castro, Santiago and
                  Caba, Fabian},
  title        = {{FitCLIP}: Refining Large-Scale Pretrained Image-Text Models for Zero-Shot
                  Video Understanding Tasks},
  booktitle    = {33rd British Machine Vision Conference 2022, {BMVC} 2022, London,
                  UK, November 21-24, 2022},
  pages        = {939},
  publisher    = {{BMVA} Press},
  year         = {2022},
  url          = {https://bmvc2022.mpi-inf.mpg.de/939/},
  timestamp    = {Thu, 16 Feb 2023 16:15:04 +0100},
  biburl       = {https://dblp.org/rec/conf/bmvc/CastroC22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2022 conference paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form to keep BibTeX from splitting it.
@inproceedings{DBLP:conf/cvpr/SoldanPAH0GG22,
  author       = {Soldan, Mattia and
                  Pardo, Alejandro and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Caba Heilbron, Fabian and
                  Zhao, Chen and
                  Giancola, Silvio and
                  Ghanem, Bernard},
  title        = {{MAD:} {A} Scalable Dataset for Language Grounding in Videos from
                  Movie Audio Descriptions},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2022, New Orleans, LA, USA, June 18-24, 2022},
  pages        = {5016--5025},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/CVPR52688.2022.00497},
  doi          = {10.1109/CVPR52688.2022.00497},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/SoldanPAH0GG22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2022 conference paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form. "vCLIMB" is braced so sentence-casing styles
% keep its capitalisation.
@inproceedings{DBLP:conf/cvpr/VillaAEHAG22,
  author       = {Villa, Andr{\'{e}}s and
                  Alhamoud, Kumail and
                  Escorcia, Victor and
                  Caba Heilbron, Fabian and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Ghanem, Bernard},
  title        = {{vCLIMB}: {A} Novel Video Class Incremental Learning Benchmark},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2022, New Orleans, LA, USA, June 18-24, 2022},
  pages        = {19013--19022},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/CVPR52688.2022.01845},
  doi          = {10.1109/CVPR52688.2022.01845},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/VillaAEHAG22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2022 conference paper (LNCS vol. 13668). The doi and url values are stored
% verbatim (no backslash before the underscore), "AI" is braced against
% sentence-casing, and the two-word surname "Caba Heilbron" uses "Last, First" form.
@inproceedings{DBLP:conf/eccv/ArgawHLWK22,
  author       = {Argaw, Dawit Mureja and
                  Caba Heilbron, Fabian and
                  Lee, Joon{-}Young and
                  Woodson, Markus and
                  Kweon, In So},
  editor       = {Avidan, Shai and
                  Brostow, Gabriel J. and
                  Ciss{\'{e}}, Moustapha and
                  Farinella, Giovanni Maria and
                  Hassner, Tal},
  title        = {The Anatomy of Video Editing: {A} Dataset and Benchmark Suite for
                  {AI}-Assisted Video Editing},
  booktitle    = {Computer Vision - {ECCV} 2022 - 17th European Conference, Tel Aviv,
                  Israel, October 23-27, 2022, Proceedings, Part {VIII}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13668},
  pages        = {201--218},
  publisher    = {Springer},
  year         = {2022},
  url          = {https://doi.org/10.1007/978-3-031-20074-8_12},
  doi          = {10.1007/978-3-031-20074-8_12},
  timestamp    = {Wed, 16 Nov 2022 21:55:17 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/ArgawHLWK22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2022 conference paper (LNCS vol. 13667). The doi and url values are stored
% verbatim (no backslash before the underscore), "MovieCuts" is braced against
% sentence-casing, and the two-word surname "Caba Heilbron" uses "Last, First" form.
@inproceedings{DBLP:conf/eccv/PardoHATG22,
  author       = {Pardo, Alejandro and
                  Caba Heilbron, Fabian and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Thabet, Ali K. and
                  Ghanem, Bernard},
  editor       = {Avidan, Shai and
                  Brostow, Gabriel J. and
                  Ciss{\'{e}}, Moustapha and
                  Farinella, Giovanni Maria and
                  Hassner, Tal},
  title        = {{MovieCuts}: {A} New Dataset and Benchmark for Cut Type Recognition},
  booktitle    = {Computer Vision - {ECCV} 2022 - 17th European Conference, Tel Aviv,
                  Israel, October 23-27, 2022, Proceedings, Part {VII}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13667},
  pages        = {668--685},
  publisher    = {Springer},
  year         = {2022},
  url          = {https://doi.org/10.1007/978-3-031-20071-7_39},
  doi          = {10.1007/978-3-031-20071-7_39},
  timestamp    = {Sun, 25 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/PardoHATG22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACM Multimedia 2022 conference paper. The two-word surnames "Caba Heilbron"
% (author) and "Del Bimbo" (editor) are given in "Last, First" form so BibTeX
% does not treat their first word as a given name.
@inproceedings{DBLP:conf/mm/XiongHL22,
  author       = {Xiong, Yu and
                  Caba Heilbron, Fabian and
                  Lin, Dahua},
  editor       = {Magalh{\~{a}}es, Jo{\~{a}}o and
                  Del Bimbo, Alberto and
                  Satoh, Shin'ichi and
                  Sebe, Nicu and
                  Alameda{-}Pineda, Xavier and
                  Jin, Qin and
                  Oria, Vincent and
                  Toni, Laura},
  title        = {Transcript to Video: Efficient Clip Sequencing from Texts},
  booktitle    = {{MM} '22: The 30th {ACM} International Conference on Multimedia, Lisboa,
                  Portugal, October 10 - 14, 2022},
  pages        = {5407--5416},
  publisher    = {{ACM}},
  year         = {2022},
  url          = {https://doi.org/10.1145/3503161.3548268},
  doi          = {10.1145/3503161.3548268},
  timestamp    = {Fri, 14 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mm/XiongHL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2201.09381 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form. "vCLIMB" is braced so sentence-casing
% styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2201-09381,
  author       = {Villa, Andr{\'{e}}s and
                  Alhamoud, Kumail and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Caba Heilbron, Fabian and
                  Escorcia, Victor and
                  Ghanem, Bernard},
  title        = {{vCLIMB}: {A} Novel Video Class Incremental Learning Benchmark},
  journal      = {CoRR},
  volume       = {abs/2201.09381},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.09381},
  eprinttype   = {arXiv},
  eprint       = {2201.09381},
  timestamp    = {Thu, 23 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-09381.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.04947 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form to keep BibTeX from splitting it.
@article{DBLP:journals/corr/abs-2202-04947,
  author       = {Ramazanova, Merey and
                  Escorcia, Victor and
                  Caba Heilbron, Fabian and
                  Zhao, Chen and
                  Ghanem, Bernard},
  title        = {{OWL} (Observe, Watch, Listen): Localizing Actions in Egocentric Video
                  via Audiovisual Temporal Context},
  journal      = {CoRR},
  volume       = {abs/2202.04947},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.04947},
  eprinttype   = {arXiv},
  eprint       = {2202.04947},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-04947.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.13371 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form. "FitCLIP" is braced so sentence-casing
% styles do not turn it into "Fitclip".
@article{DBLP:journals/corr/abs-2203-13371,
  author       = {Castro, Santiago and
                  Caba Heilbron, Fabian},
  title        = {{FitCLIP}: Refining Large-Scale Pretrained Image-Text Models for Zero-Shot
                  Video Understanding Tasks},
  journal      = {CoRR},
  volume       = {abs/2203.13371},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.13371},
  doi          = {10.48550/ARXIV.2203.13371},
  eprinttype   = {arXiv},
  eprint       = {2203.13371},
  timestamp    = {Tue, 29 Mar 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-13371.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.05609 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form. "Video-ReTime" is braced so
% sentence-casing styles keep the inner capital.
@article{DBLP:journals/corr/abs-2205-05609,
  author       = {Jenni, Simon and
                  Woodson, Markus and
                  Caba Heilbron, Fabian},
  title        = {{Video-ReTime}: Learning Temporally Varying Speediness for Time Remapping},
  journal      = {CoRR},
  volume       = {abs/2205.05609},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.05609},
  doi          = {10.48550/ARXIV.2205.05609},
  eprinttype   = {arXiv},
  eprint       = {2205.05609},
  timestamp    = {Tue, 17 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-05609.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2207.09812 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form. "AI" is braced so sentence-casing
% styles do not lowercase it.
@article{DBLP:journals/corr/abs-2207-09812,
  author       = {Argaw, Dawit Mureja and
                  Caba Heilbron, Fabian and
                  Lee, Joon{-}Young and
                  Woodson, Markus and
                  Kweon, In So},
  title        = {The Anatomy of Video Editing: {A} Dataset and Benchmark Suite for
                  {AI}-Assisted Video Editing},
  journal      = {CoRR},
  volume       = {abs/2207.09812},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.09812},
  doi          = {10.48550/ARXIV.2207.09812},
  eprinttype   = {arXiv},
  eprint       = {2207.09812},
  timestamp    = {Mon, 25 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-09812.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.12492 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form. "VideoMap" is braced so sentence-casing
% styles do not turn it into "Videomap".
@article{DBLP:journals/corr/abs-2211-12492,
  author       = {Lin, David Chuan{-}En and
                  Caba Heilbron, Fabian and
                  Lee, Joon{-}Young and
                  Wang, Oliver and
                  Martelaro, Nikolas},
  title        = {{VideoMap}: Video Editing in Latent Space},
  journal      = {CoRR},
  volume       = {abs/2211.12492},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.12492},
  doi          = {10.48550/ARXIV.2211.12492},
  eprinttype   = {arXiv},
  eprint       = {2211.12492},
  timestamp    = {Thu, 24 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-12492.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.12493 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form to keep BibTeX from splitting it.
@article{DBLP:journals/corr/abs-2211-12493,
  author       = {Lin, David Chuan{-}En and
                  Caba Heilbron, Fabian and
                  Lee, Joon{-}Young and
                  Wang, Oliver and
                  Martelaro, Nikolas},
  title        = {Videogenic: Video Highlights via Photogenic Moments},
  journal      = {CoRR},
  volume       = {abs/2211.12493},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.12493},
  doi          = {10.48550/ARXIV.2211.12493},
  eprinttype   = {arXiv},
  eprint       = {2211.12493},
  timestamp    = {Thu, 24 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-12493.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.04842 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form to keep BibTeX from splitting it.
@article{DBLP:journals/corr/abs-2212-04842,
  author       = {Villa, Andr{\'{e}}s and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Alfarra, Motasem and
                  Alhamoud, Kumail and
                  Hurtado, Julio and
                  Caba Heilbron, Fabian and
                  Soto, Alvaro and
                  Ghanem, Bernard},
  title        = {{PIVOT:} Prompting for Video Continual Learning},
  journal      = {CoRR},
  volume       = {abs/2212.04842},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.04842},
  doi          = {10.48550/ARXIV.2212.04842},
  eprinttype   = {arXiv},
  eprint       = {2212.04842},
  timestamp    = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-04842.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, vol. 6 no. 1 (2021). The journal title is stored in full so
% the bibliography style decides on abbreviation. The two-word surname
% "Caba Heilbron" uses "Last, First" form.
@article{DBLP:journals/ral/HuPHWLSS21,
  author       = {Hu, Ping and
                  Perazzi, Federico and
                  Caba Heilbron, Fabian and
                  Wang, Oliver and
                  Lin, Zhe and
                  Saenko, Kate and
                  Sclaroff, Stan},
  title        = {Real-Time Semantic Segmentation With Fast Attention},
  journal      = {{IEEE} Robotics and Automation Letters},
  volume       = {6},
  number       = {1},
  pages        = {263--270},
  year         = {2021},
  url          = {https://doi.org/10.1109/LRA.2020.3039744},
  doi          = {10.1109/LRA.2020.3039744},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ral/HuPHWLSS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR Workshops 2021 paper. The url is stored verbatim (no backslash before the
% underscores). The first author's name carries the same accents used for this
% author in the other records of this file.
% NOTE(review): confirm the accented spelling against the paper byline if exact
% fidelity to the published name is required.
@inproceedings{DBLP:conf/cvpr/AlcazarCMPLAG21,
  author       = {Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Caba, Fabian and
                  Mai, Long and
                  Perazzi, Federico and
                  Lee, Joon{-}Young and
                  Arbel{\'{a}}ez, Pablo and
                  Ghanem, Bernard},
  title        = {{APES:} Audiovisual Person Search in Untrimmed Video},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition Workshops,
                  {CVPR} Workshops 2021, virtual, June 19-25, 2021},
  pages        = {1720--1729},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2021},
  url          = {https://openaccess.thecvf.com/content/CVPR2021W/MULA/html/Alcazar_APES_Audiovisual_Person_Search_in_Untrimmed_Video_CVPRW_2021_paper.html},
  doi          = {10.1109/CVPRW53098.2021.00188},
  timestamp    = {Thu, 18 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/AlcazarCMPLAG21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2021 conference paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form to keep BibTeX from splitting it.
@inproceedings{DBLP:conf/iccv/AlcazarHTG21,
  author       = {Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Caba Heilbron, Fabian and
                  Thabet, Ali K. and
                  Ghanem, Bernard},
  title        = {{MAAS:} Multi-modal Assignation for Active Speaker Detection},
  booktitle    = {2021 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                  2021, Montreal, QC, Canada, October 10-17, 2021},
  pages        = {265--274},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICCV48922.2021.00033},
  doi          = {10.1109/ICCV48922.2021.00033},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iccv/AlcazarHTG21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2021 conference paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form to keep BibTeX from splitting it.
@inproceedings{DBLP:conf/iccv/PardoHATG21,
  author       = {Pardo, Alejandro and
                  Caba Heilbron, Fabian and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Thabet, Ali K. and
                  Ghanem, Bernard},
  title        = {Learning to Cut by Watching Movies},
  booktitle    = {2021 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                  2021, Montreal, QC, Canada, October 10-17, 2021},
  pages        = {6838--6848},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICCV48922.2021.00678},
  doi          = {10.1109/ICCV48922.2021.00678},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iccv/PardoHATG21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV Workshops 2021 paper. The venue province is QC (Quebec), matching the
% ICCV 2021 records in this file; the exported "BC" was incorrect.
@inproceedings{DBLP:conf/iccvw/HuangBWCA21,
  author       = {Huang, Yuzhong and
                  Bai, Xue and
                  Wang, Oliver and
                  Caba, Fabian and
                  Agarwala, Aseem},
  title        = {Learning Where to Cut from Edited Videos},
  booktitle    = {{IEEE/CVF} International Conference on Computer Vision Workshops,
                  {ICCVW} 2021, Montreal, QC, Canada, October 11-17, 2021},
  pages        = {3208--3216},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICCVW54120.2021.00360},
  doi          = {10.1109/ICCVW54120.2021.00360},
  timestamp    = {Fri, 03 Dec 2021 17:37:22 +0100},
  biburl       = {https://dblp.org/rec/conf/iccvw/HuangBWCA21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% WACV 2021 conference paper. "Caba Heilbron" is a two-word surname, so names
% are given in "Last, First" form. "RefineLoc" is braced so sentence-casing
% styles do not turn it into "Refineloc".
@inproceedings{DBLP:conf/wacv/PardoAHTG21,
  author       = {Pardo, Alejandro and
                  Alwassel, Humam and
                  Caba Heilbron, Fabian and
                  Thabet, Ali K. and
                  Ghanem, Bernard},
  title        = {{RefineLoc}: Iterative Refinement for Weakly-Supervised Action Localization},
  booktitle    = {{IEEE} Winter Conference on Applications of Computer Vision, {WACV}
                  2021, Waikoloa, HI, USA, January 3-8, 2021},
  pages        = {3318--3327},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/WACV48630.2021.00336},
  doi          = {10.1109/WACV48630.2021.00336},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/wacv/PardoAHTG21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2101.03682 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form to keep BibTeX from splitting it.
@article{DBLP:journals/corr/abs-2101-03682,
  author       = {Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Caba Heilbron, Fabian and
                  Thabet, Ali K. and
                  Ghanem, Bernard},
  title        = {{MAAS:} Multi-modal Assignation for Active Speaker Detection},
  journal      = {CoRR},
  volume       = {abs/2101.03682},
  year         = {2021},
  url          = {https://arxiv.org/abs/2101.03682},
  eprinttype   = {arXiv},
  eprint       = {2101.03682},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2101-03682.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.01667 (CoRR). "Caba Heilbron" is a two-word surname, so
% names are given in "Last, First" form. The first author's name carries the
% same accents used for this author in the other records of this file.
% NOTE(review): confirm the accented spelling against the paper byline if exact
% fidelity to the published name is required.
@article{DBLP:journals/corr/abs-2106-01667,
  author       = {Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Mai, Long and
                  Perazzi, Federico and
                  Lee, Joon{-}Young and
                  Arbel{\'{a}}ez, Pablo and
                  Ghanem, Bernard and
                  Caba Heilbron, Fabian},
  title        = {{APES:} Audiovisual Person Search in Untrimmed Video},
  journal      = {CoRR},
  volume       = {abs/2106.01667},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.01667},
  eprinttype   = {arXiv},
  eprint       = {2106.01667},
  timestamp    = {Thu, 18 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-01667.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2107-11851,
  author       = {Xiong, Yu and
                  Heilbron, Fabian Caba and
                  Lin, Dahua},
  title        = {Transcript to Video: Efficient Clip Sequencing from Texts},
  journal      = {CoRR},
  volume       = {abs/2107.11851},
  year         = {2021},
  url          = {https://arxiv.org/abs/2107.11851},
  eprinttype   = {arXiv},
  eprint       = {2107.11851},
  timestamp    = {Thu, 29 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2107-11851.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2108-04294,
  author       = {Pardo, Alejandro and
                  Heilbron, Fabian Caba and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Thabet, Ali K. and
                  Ghanem, Bernard},
  title        = {Learning to Cut by Watching Movies},
  journal      = {CoRR},
  volume       = {abs/2108.04294},
  year         = {2021},
  url          = {https://arxiv.org/abs/2108.04294},
  eprinttype   = {arXiv},
  eprint       = {2108.04294},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2108-04294.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-05569,
  author       = {Pardo, Alejandro and
                  Heilbron, Fabian Caba and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Thabet, Ali K. and
                  Ghanem, Bernard},
  title        = {{MovieCuts}: {A} New Dataset and Benchmark for Cut Type Recognition},
  journal      = {CoRR},
  volume       = {abs/2109.05569},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.05569},
  eprinttype   = {arXiv},
  eprint       = {2109.05569},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-05569.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-00431,
  author       = {Soldan, Mattia and
                  Pardo, Alejandro and
                  Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Heilbron, Fabian Caba and
                  Zhao, Chen and
                  Giancola, Silvio and
                  Ghanem, Bernard},
  title        = {{MAD:} {A} Scalable Dataset for Language Grounding in Videos from
                  Movie Audio Descriptions},
  journal      = {CoRR},
  volume       = {abs/2112.00431},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.00431},
  eprinttype   = {arXiv},
  eprint       = {2112.00431},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-00431.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/access/Baptista-RiosLH20,
  author       = {Baptista{-}R{\'{\i}}os, Marcos and
                  L{\'{o}}pez{-}Sastre, Roberto Javier and
                  Heilbron, Fabian Caba and
                  van Gemert, Jan C. and
                  Acevedo{-}Rodr{\'{\i}}guez, Francisco Javier and
                  Maldonado{-}Basc{\'{o}}n, Saturnino},
  title        = {Rethinking Online Action Detection in Untrimmed Videos: {A} Novel
                  Online Evaluation Protocol},
  journal      = {{IEEE} Access},
  volume       = {8},
  pages        = {5139--5146},
  year         = {2020},
  url          = {https://doi.org/10.1109/ACCESS.2019.2961789},
  doi          = {10.1109/ACCESS.2019.2961789},
  timestamp    = {Fri, 21 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/access/Baptista-RiosLH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/HuCWLSP20,
  author       = {Hu, Ping and
                  Caba, Fabian and
                  Wang, Oliver and
                  Lin, Zhe and
                  Sclaroff, Stan and
                  Perazzi, Federico},
  title        = {Temporally Distributed Networks for Fast Video Semantic Segmentation},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages        = {8815--8824},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Hu\_Temporally\_Distributed\_Networks\_for\_Fast\_Video\_Semantic\_Segmentation\_CVPR\_2020\_paper.html},
  doi          = {10.1109/CVPR42600.2020.00884},
  timestamp    = {Tue, 31 Aug 2021 14:00:04 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/HuCWLSP20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/AlcazarCMPLAG20,
  author       = {Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Caba, Fabian and
                  Mai, Long and
                  Perazzi, Federico and
                  Lee, Joon{-}Young and
                  Arbel{\'{a}}ez, Pablo and
                  Ghanem, Bernard},
  title        = {Active Speakers in Context},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages        = {12462--12471},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Alcazar\_Active\_Speakers\_in\_Context\_CVPR\_2020\_paper.html},
  doi          = {10.1109/CVPR42600.2020.01248},
  timestamp    = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/AlcazarCMPLAG20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-09970,
  author       = {Baptista{-}R{\'{\i}}os, Marcos and
                  L{\'{o}}pez{-}Sastre, Roberto Javier and
                  Heilbron, Fabian Caba and
                  van Gemert, Jan and
                  Acevedo{-}Rodr{\'{\i}}guez, Francisco Javier and
                  Maldonado{-}Basc{\'{o}}n, Saturnino},
  title        = {The Instantaneous Accuracy: a Novel Metric for the Problem of Online
                  Human Behaviour Recognition in Untrimmed Videos},
  journal      = {CoRR},
  volume       = {abs/2003.09970},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.09970},
  eprinttype   = {arXiv},
  eprint       = {2003.09970},
  timestamp    = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-09970.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-12041,
  author       = {Baptista{-}R{\'{\i}}os, Marcos and
                  L{\'{o}}pez{-}Sastre, Roberto Javier and
                  Heilbron, Fabian Caba and
                  van Gemert, Jan and
                  Acevedo{-}Rodr{\'{\i}}guez, Francisco Javier and
                  Maldonado{-}Basc{\'{o}}n, Saturnino},
  title        = {Rethinking Online Action Detection in Untrimmed Videos: {A} Novel
                  Online Evaluation Protocol},
  journal      = {CoRR},
  volume       = {abs/2003.12041},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.12041},
  eprinttype   = {arXiv},
  eprint       = {2003.12041},
  timestamp    = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-12041.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-01800,
  author       = {Hu, Ping and
                  Heilbron, Fabian Caba and
                  Wang, Oliver and
                  Lin, Zhe L. and
                  Sclaroff, Stan and
                  Perazzi, Federico},
  title        = {Temporally Distributed Networks for Fast Video Semantic Segmentation},
  journal      = {CoRR},
  volume       = {abs/2004.01800},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.01800},
  eprinttype   = {arXiv},
  eprint       = {2004.01800},
  timestamp    = {Wed, 08 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-01800.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-09812,
  author       = {Alc{\'{a}}zar, Juan Le{\'{o}}n and
                  Heilbron, Fabian Caba and
                  Mai, Long and
                  Perazzi, Federico and
                  Lee, Joon{-}Young and
                  Arbel{\'{a}}ez, Pablo and
                  Ghanem, Bernard},
  title        = {Active Speakers in Context},
  journal      = {CoRR},
  volume       = {abs/2005.09812},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.09812},
  eprinttype   = {arXiv},
  eprint       = {2005.09812},
  timestamp    = {Thu, 18 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-09812.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-03815,
  author       = {Hu, Ping and
                  Perazzi, Federico and
                  Heilbron, Fabian Caba and
                  Wang, Oliver and
                  Lin, Zhe and
                  Saenko, Kate and
                  Sclaroff, Stan},
  title        = {Real-time Semantic Segmentation with Fast Attention},
  journal      = {CoRR},
  volume       = {abs/2007.03815},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.03815},
  eprinttype   = {arXiv},
  eprint       = {2007.03815},
  timestamp    = {Wed, 09 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-03815.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccvw/Baptista-RiosLH19,
  author       = {Baptista{-}R{\'{\i}}os, Marcos and
                  L{\'{o}}pez{-}Sastre, Roberto Javier and
                  Heilbron, Fabian Caba and
                  van Gemert, Jan and
                  Acevedo{-}Rodr{\'{\i}}guez, Francisco Javier and
                  Maldonado{-}Basc{\'{o}}n, Saturnino},
  title        = {The Instantaneous Accuracy: a Novel Metric for the Problem of Online
                  Human Behaviour Recognition in Untrimmed Videos},
  booktitle    = {2019 {IEEE/CVF} International Conference on Computer Vision Workshops,
                  {ICCV} Workshops 2019, Seoul, Korea (South), October 27-28, 2019},
  pages        = {1282--1284},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICCVW.2019.00162},
  doi          = {10.1109/ICCVW.2019.00162},
  timestamp    = {Thu, 12 Mar 2020 10:53:35 +0100},
  biburl       = {https://dblp.org/rec/conf/iccvw/Baptista-RiosLH19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccvw/HeilbronPBD19,
  author       = {Heilbron, Fabian Caba and
                  Pepik, Bojan and
                  Barzelay, Zohar and
                  Donoser, Michael},
  title        = {Clothing Recognition in the Wild using the {Amazon} Catalog},
  booktitle    = {2019 {IEEE/CVF} International Conference on Computer Vision Workshops,
                  {ICCV} Workshops 2019, Seoul, Korea (South), October 27-28, 2019},
  pages        = {3145--3148},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICCVW.2019.00385},
  doi          = {10.1109/ICCVW.2019.00385},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccvw/HeilbronPBD19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1904-00227,
  author       = {Alwassel, Humam and
                  Heilbron, Fabian Caba and
                  Thabet, Ali K. and
                  Ghanem, Bernard},
  title        = {{RefineLoc}: Iterative Refinement for Weakly-Supervised Action Localization},
  journal      = {CoRR},
  volume       = {abs/1904.00227},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.00227},
  eprinttype   = {arXiv},
  eprint       = {1904.00227},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-00227.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eccv/HeilbronLJG18,
  author       = {Heilbron, Fabian Caba and
                  Lee, Joon{-}Young and
                  Jin, Hailin and
                  Ghanem, Bernard},
  editor       = {Ferrari, Vittorio and
                  Hebert, Martial and
                  Sminchisescu, Cristian and
                  Weiss, Yair},
  title        = {What Do {I} Annotate Next? An Empirical Study of Active Learning for
                  Action Localization},
  booktitle    = {Computer Vision - {ECCV} 2018 - 15th European Conference, Munich,
                  Germany, September 8-14, 2018, Proceedings, Part {XI}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11215},
  pages        = {212--229},
  publisher    = {Springer},
  year         = {2018},
  url          = {https://doi.org/10.1007/978-3-030-01252-6\_13},
  doi          = {10.1007/978-3-030-01252-6\_13},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/HeilbronLJG18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eccv/AlwasselHG18,
  author       = {Alwassel, Humam and
                  Heilbron, Fabian Caba and
                  Ghanem, Bernard},
  editor       = {Ferrari, Vittorio and
                  Hebert, Martial and
                  Sminchisescu, Cristian and
                  Weiss, Yair},
  title        = {Action Search: Spotting Actions in Videos and Its Application to Temporal
                  Action Localization},
  booktitle    = {Computer Vision - {ECCV} 2018 - 15th European Conference, Munich,
                  Germany, September 8-14, 2018, Proceedings, Part {IX}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11213},
  pages        = {253--269},
  publisher    = {Springer},
  year         = {2018},
  url          = {https://doi.org/10.1007/978-3-030-01240-3\_16},
  doi          = {10.1007/978-3-030-01240-3\_16},
  timestamp    = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eccv/AlwasselHG18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eccv/AlwasselHEG18,
  author       = {Alwassel, Humam and
                  Heilbron, Fabian Caba and
                  Escorcia, Victor and
                  Ghanem, Bernard},
  editor       = {Ferrari, Vittorio and
                  Hebert, Martial and
                  Sminchisescu, Cristian and
                  Weiss, Yair},
  title        = {Diagnosing Error in Temporal Action Detectors},
  booktitle    = {Computer Vision - {ECCV} 2018 - 15th European Conference, Munich,
                  Germany, September 8-14, 2018, Proceedings, Part {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11207},
  pages        = {264--280},
  publisher    = {Springer},
  year         = {2018},
  url          = {https://doi.org/10.1007/978-3-030-01219-9\_16},
  doi          = {10.1007/978-3-030-01219-9\_16},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eccv/AlwasselHEG18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-10706,
  author       = {Alwassel, Humam and
                  Heilbron, Fabian Caba and
                  Escorcia, Victor and
                  Ghanem, Bernard},
  title        = {Diagnosing Error in Temporal Action Detectors},
  journal      = {CoRR},
  volume       = {abs/1807.10706},
  year         = {2018},
  url          = {https://arxiv.org/abs/1807.10706},
  eprinttype   = {arXiv},
  eprint       = {1807.10706},
  timestamp    = {Fri, 09 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-10706.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-03766,
  author       = {Ghanem, Bernard and
                  Niebles, Juan Carlos and
                  Snoek, Cees and
                  Heilbron, Fabian Caba and
                  Alwassel, Humam and
                  Escorcia, Victor and
                  Krishna, Ranjay and
                  Buch, Shyamal and
                  Dao, Cuong Duc},
  title        = {The {ActivityNet} Large-Scale Activity Recognition Challenge 2018 Summary},
  journal      = {CoRR},
  volume       = {abs/1808.03766},
  year         = {2018},
  url          = {https://arxiv.org/abs/1808.03766},
  eprinttype   = {arXiv},
  eprint       = {1808.03766},
  timestamp    = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-03766.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/HeilbronBEG17,
  author       = {Heilbron, Fabian Caba and
                  Barrios, Wayner and
                  Escorcia, Victor and
                  Ghanem, Bernard},
  title        = {{SCC:} Semantic Context Cascade for Efficient Action Detection},
  booktitle    = {2017 {IEEE} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2017, Honolulu, HI, USA, July 21-26, 2017},
  pages        = {3175--3184},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/CVPR.2017.338},
  doi          = {10.1109/CVPR.2017.338},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/HeilbronBEG17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/AlwasselHG17,
  author       = {Alwassel, Humam and
                  Heilbron, Fabian Caba and
                  Ghanem, Bernard},
  title        = {Action Search: Learning to Search for Human Activities in Untrimmed
                  Videos},
  journal      = {CoRR},
  volume       = {abs/1706.04269},
  year         = {2017},
  url          = {https://arxiv.org/abs/1706.04269},
  eprinttype   = {arXiv},
  eprint       = {1706.04269},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/AlwasselHG17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1710-08011,
  author       = {Ghanem, Bernard and
                  Niebles, Juan Carlos and
                  Snoek, Cees and
                  Heilbron, Fabian Caba and
                  Alwassel, Humam and
                  Krishna, Ranjay and
                  Escorcia, Victor and
                  Hata, Kenji and
                  Buch, Shyamal},
  title        = {{ActivityNet} Challenge 2017 Summary},
  journal      = {CoRR},
  volume       = {abs/1710.08011},
  year         = {2017},
  url          = {https://arxiv.org/abs/1710.08011},
  eprinttype   = {arXiv},
  eprint       = {1710.08011},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-08011.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/HeilbronNG16,
  author       = {Heilbron, Fabian Caba and
                  Niebles, Juan Carlos and
                  Ghanem, Bernard},
  title        = {Fast Temporal Activity Proposals for Efficient Detection of Human
                  Actions in Untrimmed Videos},
  booktitle    = {2016 {IEEE} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2016, Las Vegas, NV, USA, June 27-30, 2016},
  pages        = {1914--1923},
  publisher    = {{IEEE} Computer Society},
  year         = {2016},
  url          = {https://doi.org/10.1109/CVPR.2016.211},
  doi          = {10.1109/CVPR.2016.211},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/HeilbronNG16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eccv/EscorciaHNG16,
  author       = {Escorcia, Victor and
                  Heilbron, Fabian Caba and
                  Niebles, Juan Carlos and
                  Ghanem, Bernard},
  editor       = {Leibe, Bastian and
                  Matas, Jiri and
                  Sebe, Nicu and
                  Welling, Max},
  title        = {{DAPs}: Deep Action Proposals for Action Understanding},
  booktitle    = {Computer Vision - {ECCV} 2016 - 14th European Conference, Amsterdam,
                  The Netherlands, October 11-14, 2016, Proceedings, Part {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {9907},
  pages        = {768--784},
  publisher    = {Springer},
  year         = {2016},
  url          = {https://doi.org/10.1007/978-3-319-46487-9\_47},
  doi          = {10.1007/978-3-319-46487-9\_47},
  timestamp    = {Wed, 07 Dec 2022 23:10:23 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/EscorciaHNG16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/HeilbronEGN15,
  author       = {Heilbron, Fabian Caba and
                  Escorcia, Victor and
                  Ghanem, Bernard and
                  Niebles, Juan Carlos},
  title        = {{ActivityNet}: {A} large-scale video benchmark for human activity understanding},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2015, Boston, MA, USA, June 7-12, 2015},
  pages        = {961--970},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/CVPR.2015.7298698},
  doi          = {10.1109/CVPR.2015.7298698},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/HeilbronEGN15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/GhanemTNH15,
  author       = {Ghanem, Bernard and
                  Thabet, Ali K. and
                  Niebles, Juan Carlos and
                  Heilbron, Fabian Caba},
  title        = {Robust {Manhattan} Frame estimation from a single {RGB-D} image},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2015, Boston, MA, USA, June 7-12, 2015},
  pages        = {3772--3780},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/CVPR.2015.7299001},
  doi          = {10.1109/CVPR.2015.7299001},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/GhanemTNH15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/accv/HeilbronTNG14,
  author       = {Heilbron, Fabian Caba and
                  Thabet, Ali K. and
                  Niebles, Juan Carlos and
                  Ghanem, Bernard},
  editor       = {Cremers, Daniel and
                  Reid, Ian D. and
                  Saito, Hideo and
                  Yang, Ming{-}Hsuan},
  title        = {Camera Motion and Surrounding Scene Appearance as Context for Action
                  Recognition},
  booktitle    = {Computer Vision - {ACCV} 2014 - 12th Asian Conference on Computer
                  Vision, Singapore, Singapore, November 1-5, 2014, Revised Selected
                  Papers, Part {IV}},
  series       = {Lecture Notes in Computer Science},
  volume       = {9006},
  pages        = {583--597},
  publisher    = {Springer},
  year         = {2014},
  url          = {https://doi.org/10.1007/978-3-319-16817-3\_38},
  doi          = {10.1007/978-3-319-16817-3\_38},
  timestamp    = {Tue, 14 May 2019 10:00:50 +0200},
  biburl       = {https://dblp.org/rec/conf/accv/HeilbronTNG14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mir/HeilbronN14,
  author       = {Heilbron, Fabian Caba and
                  Niebles, Juan Carlos},
  editor       = {Kankanhalli, Mohan S. and
                  R{\"{u}}ger, Stefan M. and
                  Manmatha, R. and
                  Jose, Joemon M. and
                  van Rijsbergen, Keith},
  title        = {Collecting and Annotating Human Activities in Web Videos},
  booktitle    = {International Conference on Multimedia Retrieval, {ICMR} '14, Glasgow,
                  United Kingdom - April 01 - 04, 2014},
  pages        = {377},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2578726.2578775},
  doi          = {10.1145/2578726.2578775},
  timestamp    = {Thu, 15 Jul 2021 17:18:30 +0200},
  biburl       = {https://dblp.org/rec/conf/mir/HeilbronN14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics